libavcodec/vorbis_enc.c

   1 /*
   2  * copyright (c) 2006 Oded Shimon <ods15@ods15.dyndns.org>
   3  *
   4  * This file is part of FFmpeg.
   5  *
   6  * FFmpeg is free software; you can redistribute it and/or
   7  * modify it under the terms of the GNU Lesser General Public
   8  * License as published by the Free Software Foundation; either
   9  * version 2.1 of the License, or (at your option) any later version.
  10  *
  11  * FFmpeg is distributed in the hope that it will be useful,
  12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14  * Lesser General Public License for more details.
  15  *
  16  * You should have received a copy of the GNU Lesser General Public
  17  * License along with FFmpeg; if not, write to the Free Software
  18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19  */
  20
  21 /**
  22  * @file vorbis_enc.c
  23  * Native Vorbis encoder.
  24  * @author Oded Shimon <ods15@ods15.dyndns.org>
  25  */
  26
  27 #include <float.h>
  28 #include "avcodec.h"
  29 #include "dsputil.h"
  30 #include "vorbis.h"
  31 #include "vorbis_enc_data.h"
  32
  33 #undef NDEBUG
  34 #include <assert.h>
  35
  36 typedef struct {
  37     int nentries;
  38     uint8_t * lens;
  39     uint32_t * codewords;
  40     int ndimentions;
  41     float min;
  42     float delta;
  43     int seq_p;
  44     int lookup;
  45     int * quantlist;
  46     float * dimentions;
  47     float * pow2;
  48 } codebook_t;
  49
  50 typedef struct {
  51     int dim;
  52     int subclass;
  53     int masterbook;
  54     int * books;
  55 } floor_class_t;
  56
  57 typedef struct {
  58     int partitions;
  59     int * partition_to_class;
  60     int nclasses;
  61     floor_class_t * classes;
  62     int multiplier;
  63     int rangebits;
  64     int values;
  65     floor1_entry_t * list;
  66 } floor_t;
  67
  68 typedef struct {
  69     int type;
  70     int begin;
  71     int end;
  72     int partition_size;
  73     int classifications;
  74     int classbook;
  75     int8_t (*books)[8];
  76     float (*maxes)[2];
  77 } residue_t;
  78
  79 typedef struct {
  80     int submaps;
  81     int * mux;
  82     int * floor;
  83     int * residue;
  84     int coupling_steps;
  85     int * magnitude;
  86     int * angle;
  87 } mapping_t;
  88
  89 typedef struct {
  90     int blockflag;
  91     int mapping;
  92 } vorbis_mode_t;
  93
  94 typedef struct {
  95     int channels;
  96     int sample_rate;
  97     int log2_blocksize[2];
  98     MDCTContext mdct[2];
  99     const float * win[2];
 100     int have_saved;
 101     float * saved;
 102     float * samples;
 103     float * floor; // also used for tmp values for mdct
 104     float * coeffs; // also used for residue after floor
 105     float quality;
 106
 107     int ncodebooks;
 108     codebook_t * codebooks;
 109
 110     int nfloors;
 111     floor_t * floors;
 112
 113     int nresidues;
 114     residue_t * residues;
 115
 116     int nmappings;
 117     mapping_t * mappings;
 118
 119     int nmodes;
 120     vorbis_mode_t * modes;
 121
 122     int64_t sample_count;
 123 } venc_context_t;
 124
 125 typedef struct {
 126     int total;
 127     int total_pos;
 128     int pos;
 129     uint8_t * buf_ptr;
 130 } PutBitContext;
 131
 132 static inline void init_put_bits(PutBitContext * pb, uint8_t * buf, int buffer_len) {
 133     pb->total = buffer_len * 8;
 134     pb->total_pos = 0;
 135     pb->pos = 0;
 136     pb->buf_ptr = buf;
 137 }
 138
 139 static void put_bits(PutBitContext * pb, int bits, uint64_t val) {
 140     if ((pb->total_pos += bits) >= pb->total) return;
 141     if (!bits) return;
 142     if (pb->pos) {
 143         if (pb->pos > bits) {
 144             *pb->buf_ptr |= val << (8 - pb->pos);
 145             pb->pos -= bits;
 146             bits = 0;
 147         } else {
 148             *pb->buf_ptr++ |= (val << (8 - pb->pos)) & 0xFF;
 149             val >>= pb->pos;
 150             bits -= pb->pos;
 151             pb->pos = 0;
 152         }
 153     }
 154     for (; bits >= 8; bits -= 8) {
 155         *pb->buf_ptr++ = val & 0xFF;
 156         val >>= 8;
 157     }
 158     if (bits) {
 159         *pb->buf_ptr = val;
 160         pb->pos = 8 - bits;
 161     }
 162 }
 163
 164 static inline void flush_put_bits(PutBitContext * pb) {
 165 }
 166
 167 static inline int put_bits_count(PutBitContext * pb) {
 168     return pb->total_pos;
 169 }
 170
 171 static inline void put_codeword(PutBitContext * pb, codebook_t * cb, int entry) {
 172     assert(entry >= 0);
 173     assert(entry < cb->nentries);
 174     assert(cb->lens[entry]);
 175     put_bits(pb, cb->lens[entry], cb->codewords[entry]);
 176 }
 177
 178 static int cb_lookup_vals(int lookup, int dimentions, int entries) {
 179     if      (lookup == 1) return ff_vorbis_nth_root(entries, dimentions);
 180     else if (lookup == 2) return dimentions * entries;
 181     return 0;
 182 }
 183
 184 static void ready_codebook(codebook_t * cb) {
 185     int i;
 186
 187     ff_vorbis_len2vlc(cb->lens, cb->codewords, cb->nentries);
 188
 189     if (!cb->lookup)
 190         cb->pow2 = cb->dimentions = NULL;
 191     else {
 192         int vals = cb_lookup_vals(cb->lookup, cb->ndimentions, cb->nentries);
 193         cb->dimentions = av_malloc(sizeof(float) * cb->nentries * cb->ndimentions);
 194         cb->pow2 = av_mallocz(sizeof(float) * cb->nentries);
 195         for (i = 0; i < cb->nentries; i++) {
 196             float last = 0;
 197             int j;
 198             int div = 1;
 199             for (j = 0; j < cb->ndimentions; j++) {
 200                 int off;
 201                 if (cb->lookup == 1)
 202                     off = (i / div) % vals; // lookup type 1
 203                 else
 204                     off = i * cb->ndimentions + j; // lookup type 2
 205
 206                 cb->dimentions[i * cb->ndimentions + j] = last + cb->min + cb->quantlist[off] * cb->delta;
 207                 if (cb->seq_p)
 208                     last = cb->dimentions[i * cb->ndimentions + j];
 209                 cb->pow2[i] += cb->dimentions[i * cb->ndimentions + j]*cb->dimentions[i * cb->ndimentions + j];
 210                 div *= vals;
 211             }
 212             cb->pow2[i] /= 2.;
 213         }
 214     }
 215 }
 216
 217 static void ready_residue(residue_t * rc, venc_context_t * venc) {
 218     int i;
 219     assert(rc->type == 2);
 220     rc->maxes = av_mallocz(sizeof(float[2]) * rc->classifications);
 221     for (i = 0; i < rc->classifications; i++) {
 222         int j;
 223         codebook_t * cb;
 224         for (j = 0; j < 8; j++)
 225             if (rc->books[i][j] != -1) break;
 226         if (j == 8) continue; // zero
 227         cb = &venc->codebooks[rc->books[i][j]];
 228         assert(cb->ndimentions >= 2);
 229         assert(cb->lookup);
 230
 231         for (j = 0; j < cb->nentries; j++) {
 232             float a;
 233             if (!cb->lens[j]) continue;
 234             a = fabs(cb->dimentions[j * cb->ndimentions]);
 235             if (a > rc->maxes[i][0])
 236                 rc->maxes[i][0] = a;
 237             a = fabs(cb->dimentions[j * cb->ndimentions + 1]);
 238             if (a > rc->maxes[i][1])
 239                 rc->maxes[i][1] = a;
 240         }
 241     }
 242     // small bias
 243     for (i = 0; i < rc->classifications; i++) {
 244         rc->maxes[i][0] += 0.8;
 245         rc->maxes[i][1] += 0.8;
 246     }
 247 }
 248
 249 static void create_vorbis_context(venc_context_t * venc, AVCodecContext * avccontext) {
 250     floor_t * fc;
 251     residue_t * rc;
 252     mapping_t * mc;
 253     int i, book;
 254
 255     venc->channels = avccontext->channels;
 256     venc->sample_rate = avccontext->sample_rate;
 257     venc->log2_blocksize[0] = venc->log2_blocksize[1] = 11;
 258
 259     venc->ncodebooks = sizeof(cvectors)/sizeof(cvectors[0]);
 260     venc->codebooks = av_malloc(sizeof(codebook_t) * venc->ncodebooks);
 261
 262     // codebook 0..14 - floor1 book, values 0..255
 263     // codebook 15 residue masterbook
 264     // codebook 16..29 residue
 265     for (book = 0; book < venc->ncodebooks; book++) {
 266         codebook_t * cb = &venc->codebooks[book];
 267         int vals;
 268         cb->ndimentions = cvectors[book].dim;
 269         cb->nentries = cvectors[book].real_len;
 270         cb->min = cvectors[book].min;
 271         cb->delta = cvectors[book].delta;
 272         cb->lookup = cvectors[book].lookup;
 273         cb->seq_p = 0;
 274
 275         cb->lens = av_malloc(sizeof(uint8_t) * cb->nentries);
 276         cb->codewords = av_malloc(sizeof(uint32_t) * cb->nentries);
 277         memcpy(cb->lens, cvectors[book].clens, cvectors[book].len);
 278         memset(cb->lens + cvectors[book].len, 0, cb->nentries - cvectors[book].len);
 279
 280         if (cb->lookup) {
 281             vals = cb_lookup_vals(cb->lookup, cb->ndimentions, cb->nentries);
 282             cb->quantlist = av_malloc(sizeof(int) * vals);
 283             for (i = 0; i < vals; i++)
 284                 cb->quantlist[i] = cvectors[book].quant[i];
 285         } else {
 286             cb->quantlist = NULL;
 287         }
 288         ready_codebook(cb);
 289     }
 290
 291     venc->nfloors = 1;
 292     venc->floors = av_malloc(sizeof(floor_t) * venc->nfloors);
 293
 294     // just 1 floor
 295     fc = &venc->floors[0];
 296     fc->partitions = 8;
 297     fc->partition_to_class = av_malloc(sizeof(int) * fc->partitions);
 298     fc->nclasses = 0;
 299     for (i = 0; i < fc->partitions; i++) {
 300         static const int a[] = {0,1,2,2,3,3,4,4};
 301         fc->partition_to_class[i] = a[i];
 302         fc->nclasses = FFMAX(fc->nclasses, fc->partition_to_class[i]);
 303     }
 304     fc->nclasses++;
 305     fc->classes = av_malloc(sizeof(floor_class_t) * fc->nclasses);
 306     for (i = 0; i < fc->nclasses; i++) {
 307         floor_class_t * c = &fc->classes[i];
 308         int j, books;
 309         c->dim = floor_classes[i].dim;
 310         c->subclass = floor_classes[i].subclass;
 311         c->masterbook = floor_classes[i].masterbook;
 312         books = (1 << c->subclass);
 313         c->books = av_malloc(sizeof(int) * books);
 314         for (j = 0; j < books; j++)
 315             c->books[j] = floor_classes[i].nbooks[j];
 316     }
 317     fc->multiplier = 2;
 318     fc->rangebits = venc->log2_blocksize[0] - 1;
 319
 320     fc->values = 2;
 321     for (i = 0; i < fc->partitions; i++)
 322         fc->values += fc->classes[fc->partition_to_class[i]].dim;
 323
 324     fc->list = av_malloc(sizeof(floor1_entry_t) * fc->values);
 325     fc->list[0].x = 0;
 326     fc->list[1].x = 1 << fc->rangebits;
 327     for (i = 2; i < fc->values; i++) {
 328         static const int a[] = {
 329              93, 23,372,  6, 46,186,750, 14, 33, 65,
 330             130,260,556,  3, 10, 18, 28, 39, 55, 79,
 331             111,158,220,312,464,650,850
 332         };
 333         fc->list[i].x = a[i - 2];
 334     }
 335     ff_vorbis_ready_floor1_list(fc->list, fc->values);
 336
 337     venc->nresidues = 1;
 338     venc->residues = av_malloc(sizeof(residue_t) * venc->nresidues);
 339
 340     // single residue
 341     rc = &venc->residues[0];
 342     rc->type = 2;
 343     rc->begin = 0;
 344     rc->end = 1600;
 345     rc->partition_size = 32;
 346     rc->classifications = 10;
 347     rc->classbook = 15;
 348     rc->books = av_malloc(sizeof(*rc->books) * rc->classifications);
 349     {
 350         static const int8_t a[10][8] = {
 351             { -1, -1, -1, -1, -1, -1, -1, -1, },
 352             { -1, -1, 16, -1, -1, -1, -1, -1, },
 353             { -1, -1, 17, -1, -1, -1, -1, -1, },
 354             { -1, -1, 18, -1, -1, -1, -1, -1, },
 355             { -1, -1, 19, -1, -1, -1, -1, -1, },
 356             { -1, -1, 20, -1, -1, -1, -1, -1, },
 357             { -1, -1, 21, -1, -1, -1, -1, -1, },
 358             { 22, 23, -1, -1, -1, -1, -1, -1, },
 359             { 24, 25, -1, -1, -1, -1, -1, -1, },
 360             { 26, 27, 28, -1, -1, -1, -1, -1, },
 361         };
 362         memcpy(rc->books, a, sizeof a);
 363     }
 364     ready_residue(rc, venc);
 365
 366     venc->nmappings = 1;
 367     venc->mappings = av_malloc(sizeof(mapping_t) * venc->nmappings);
 368
 369     // single mapping
 370     mc = &venc->mappings[0];
 371     mc->submaps = 1;
 372     mc->mux = av_malloc(sizeof(int) * venc->channels);
 373     for (i = 0; i < venc->channels; i++)
 374         mc->mux[i] = 0;
 375     mc->floor = av_malloc(sizeof(int) * mc->submaps);
 376     mc->residue = av_malloc(sizeof(int) * mc->submaps);
 377     for (i = 0; i < mc->submaps; i++) {
 378         mc->floor[i] = 0;
 379         mc->residue[i] = 0;
 380     }
 381     mc->coupling_steps = venc->channels == 2 ? 1 : 0;
 382     mc->magnitude = av_malloc(sizeof(int) * mc->coupling_steps);
 383     mc->angle = av_malloc(sizeof(int) * mc->coupling_steps);
 384     if (mc->coupling_steps) {
 385         mc->magnitude[0] = 0;
 386         mc->angle[0] = 1;
 387     }
 388
 389     venc->nmodes = 1;
 390     venc->modes = av_malloc(sizeof(vorbis_mode_t) * venc->nmodes);
 391
 392     // single mode
 393     venc->modes[0].blockflag = 0;
 394     venc->modes[0].mapping = 0;
 395
 396     venc->have_saved = 0;
 397     venc->saved = av_malloc(sizeof(float) * venc->channels * (1 << venc->log2_blocksize[1]) / 2);
 398     venc->samples = av_malloc(sizeof(float) * venc->channels * (1 << venc->log2_blocksize[1]));
 399     venc->floor = av_malloc(sizeof(float) * venc->channels * (1 << venc->log2_blocksize[1]) / 2);
 400     venc->coeffs = av_malloc(sizeof(float) * venc->channels * (1 << venc->log2_blocksize[1]) / 2);
 401
 402     venc->win[0] = ff_vorbis_vwin[venc->log2_blocksize[0] - 6];
 403     venc->win[1] = ff_vorbis_vwin[venc->log2_blocksize[1] - 6];
 404
 405     ff_mdct_init(&venc->mdct[0], venc->log2_blocksize[0], 0);
 406     ff_mdct_init(&venc->mdct[1], venc->log2_blocksize[1], 0);
 407 }
 408
 409 static void put_float(PutBitContext * pb, float f) {
 410     int exp, mant;
 411     uint32_t res = 0;
 412     mant = (int)ldexp(frexp(f, &exp), 20);
 413     exp += 788 - 20;
 414     if (mant < 0) { res |= (1 << 31); mant = -mant; }
 415     res |= mant | (exp << 21);
 416     put_bits(pb, 32, res);
 417 }
 418
 419 static void put_codebook_header(PutBitContext * pb, codebook_t * cb) {
 420     int i;
 421     int ordered = 0;
 422
 423     put_bits(pb, 24, 0x564342); //magic
 424     put_bits(pb, 16, cb->ndimentions);
 425     put_bits(pb, 24, cb->nentries);
 426
 427     for (i = 1; i < cb->nentries; i++)
 428         if (cb->lens[i] < cb->lens[i-1]) break;
 429     if (i == cb->nentries)
 430         ordered = 1;
 431
 432     put_bits(pb, 1, ordered);
 433     if (ordered) {
 434         int len = cb->lens[0];
 435         put_bits(pb, 5, len - 1);
 436         i = 0;
 437         while (i < cb->nentries) {
 438             int j;
 439             for (j = 0; j+i < cb->nentries; j++)
 440                 if (cb->lens[j+i] != len) break;
 441             put_bits(pb, ilog(cb->nentries - i), j);
 442             i += j;
 443             len++;
 444         }
 445     } else {
 446         int sparse = 0;
 447         for (i = 0; i < cb->nentries; i++)
 448             if (!cb->lens[i]) break;
 449         if (i != cb->nentries)
 450             sparse = 1;
 451         put_bits(pb, 1, sparse);
 452
 453         for (i = 0; i < cb->nentries; i++) {
 454             if (sparse) put_bits(pb, 1, !!cb->lens[i]);
 455             if (cb->lens[i]) put_bits(pb, 5, cb->lens[i] - 1);
 456         }
 457     }
 458
 459     put_bits(pb, 4, cb->lookup);
 460     if (cb->lookup) {
 461         int tmp = cb_lookup_vals(cb->lookup, cb->ndimentions, cb->nentries);
 462         int bits = ilog(cb->quantlist[0]);
 463
 464         for (i = 1; i < tmp; i++)
 465             bits = FFMAX(bits, ilog(cb->quantlist[i]));
 466
 467         put_float(pb, cb->min);
 468         put_float(pb, cb->delta);
 469
 470         put_bits(pb, 4, bits - 1);
 471         put_bits(pb, 1, cb->seq_p);
 472
 473         for (i = 0; i < tmp; i++)
 474             put_bits(pb, bits, cb->quantlist[i]);
 475     }
 476 }
 477
 478 static void put_floor_header(PutBitContext * pb, floor_t * fc) {
 479     int i;
 480
 481     put_bits(pb, 16, 1); // type, only floor1 is supported
 482
 483     put_bits(pb, 5, fc->partitions);
 484
 485     for (i = 0; i < fc->partitions; i++)
 486         put_bits(pb, 4, fc->partition_to_class[i]);
 487
 488     for (i = 0; i < fc->nclasses; i++) {
 489         int j, books;
 490
 491         put_bits(pb, 3, fc->classes[i].dim - 1);
 492         put_bits(pb, 2, fc->classes[i].subclass);
 493
 494         if (fc->classes[i].subclass)
 495             put_bits(pb, 8, fc->classes[i].masterbook);
 496
 497         books = (1 << fc->classes[i].subclass);
 498
 499         for (j = 0; j < books; j++)
 500             put_bits(pb, 8, fc->classes[i].books[j] + 1);
 501     }
 502
 503     put_bits(pb, 2, fc->multiplier - 1);
 504     put_bits(pb, 4, fc->rangebits);
 505
 506     for (i = 2; i < fc->values; i++)
 507         put_bits(pb, fc->rangebits, fc->list[i].x);
 508 }
 509
 510 static void put_residue_header(PutBitContext * pb, residue_t * rc) {
 511     int i;
 512
 513     put_bits(pb, 16, rc->type);
 514
 515     put_bits(pb, 24, rc->begin);
 516     put_bits(pb, 24, rc->end);
 517     put_bits(pb, 24, rc->partition_size - 1);
 518     put_bits(pb, 6, rc->classifications - 1);
 519     put_bits(pb, 8, rc->classbook);
 520
 521     for (i = 0; i < rc->classifications; i++) {
 522         int j, tmp = 0;
 523         for (j = 0; j < 8; j++)
 524             tmp |= (rc->books[i][j] != -1) << j;
 525
 526         put_bits(pb, 3, tmp & 7);
 527         put_bits(pb, 1, tmp > 7);
 528
 529         if (tmp > 7)
 530             put_bits(pb, 5, tmp >> 3);
 531     }
 532
 533     for (i = 0; i < rc->classifications; i++) {
 534         int j;
 535         for (j = 0; j < 8; j++)
 536             if (rc->books[i][j] != -1)
 537                 put_bits(pb, 8, rc->books[i][j]);
 538     }
 539 }
 540
 541 static int put_main_header(venc_context_t * venc, uint8_t ** out) {
 542     int i;
 543     PutBitContext pb;
 544     uint8_t buffer[50000] = {0}, * p = buffer;
 545     int buffer_len = sizeof buffer;
 546     int len, hlens[3];
 547
 548     // identification header
 549     init_put_bits(&pb, p, buffer_len);
 550     put_bits(&pb, 8, 1); //magic
 551     for (i = 0; "vorbis"[i]; i++)
 552         put_bits(&pb, 8, "vorbis"[i]);
 553     put_bits(&pb, 32, 0); // version
 554     put_bits(&pb, 8, venc->channels);
 555     put_bits(&pb, 32, venc->sample_rate);
 556     put_bits(&pb, 32, 0); // bitrate
 557     put_bits(&pb, 32, 0); // bitrate
 558     put_bits(&pb, 32, 0); // bitrate
 559     put_bits(&pb, 4, venc->log2_blocksize[0]);
 560     put_bits(&pb, 4, venc->log2_blocksize[1]);
 561     put_bits(&pb, 1, 1); // framing
 562
 563     flush_put_bits(&pb);
 564     hlens[0] = (put_bits_count(&pb) + 7) / 8;
 565     buffer_len -= hlens[0];
 566     p += hlens[0];
 567
 568     // comment header
 569     init_put_bits(&pb, p, buffer_len);
 570     put_bits(&pb, 8, 3); //magic
 571     for (i = 0; "vorbis"[i]; i++)
 572         put_bits(&pb, 8, "vorbis"[i]);
 573     put_bits(&pb, 32, 0); // vendor length TODO
 574     put_bits(&pb, 32, 0); // amount of comments
 575     put_bits(&pb, 1, 1); // framing
 576
 577     flush_put_bits(&pb);
 578     hlens[1] = (put_bits_count(&pb) + 7) / 8;
 579     buffer_len -= hlens[1];
 580     p += hlens[1];
 581
 582     // setup header
 583     init_put_bits(&pb, p, buffer_len);
 584     put_bits(&pb, 8, 5); //magic
 585     for (i = 0; "vorbis"[i]; i++)
 586         put_bits(&pb, 8, "vorbis"[i]);
 587
 588     // codebooks
 589     put_bits(&pb, 8, venc->ncodebooks - 1);
 590     for (i = 0; i < venc->ncodebooks; i++)
 591         put_codebook_header(&pb, &venc->codebooks[i]);
 592
 593     // time domain, reserved, zero
 594     put_bits(&pb, 6, 0);
 595     put_bits(&pb, 16, 0);
 596
 597     // floors
 598     put_bits(&pb, 6, venc->nfloors - 1);
 599     for (i = 0; i < venc->nfloors; i++)
 600         put_floor_header(&pb, &venc->floors[i]);
 601
 602     // residues
 603     put_bits(&pb, 6, venc->nresidues - 1);
 604     for (i = 0; i < venc->nresidues; i++)
 605         put_residue_header(&pb, &venc->residues[i]);
 606
 607     // mappings
 608     put_bits(&pb, 6, venc->nmappings - 1);
 609     for (i = 0; i < venc->nmappings; i++) {
 610         mapping_t * mc = &venc->mappings[i];
 611         int j;
 612         put_bits(&pb, 16, 0); // mapping type
 613
 614         put_bits(&pb, 1, mc->submaps > 1);
 615         if (mc->submaps > 1)
 616             put_bits(&pb, 4, mc->submaps - 1);
 617
 618         put_bits(&pb, 1, !!mc->coupling_steps);
 619         if (mc->coupling_steps) {
 620             put_bits(&pb, 8, mc->coupling_steps - 1);
 621             for (j = 0; j < mc->coupling_steps; j++) {
 622                 put_bits(&pb, ilog(venc->channels - 1), mc->magnitude[j]);
 623                 put_bits(&pb, ilog(venc->channels - 1), mc->angle[j]);
 624             }
 625         }
 626
 627         put_bits(&pb, 2, 0); // reserved
 628
 629         if (mc->submaps > 1)
 630             for (j = 0; j < venc->channels; j++)
 631                 put_bits(&pb, 4, mc->mux[j]);
 632
 633         for (j = 0; j < mc->submaps; j++) {
 634             put_bits(&pb, 8, 0); // reserved time configuration
 635             put_bits(&pb, 8, mc->floor[j]);
 636             put_bits(&pb, 8, mc->residue[j]);
 637         }
 638     }
 639
 640     // modes
 641     put_bits(&pb, 6, venc->nmodes - 1);
 642     for (i = 0; i < venc->nmodes; i++) {
 643         put_bits(&pb, 1, venc->modes[i].blockflag);
 644         put_bits(&pb, 16, 0); // reserved window type
 645         put_bits(&pb, 16, 0); // reserved transform type
 646         put_bits(&pb, 8, venc->modes[i].mapping);
 647     }
 648
 649     put_bits(&pb, 1, 1); // framing
 650
 651     flush_put_bits(&pb);
 652     hlens[2] = (put_bits_count(&pb) + 7) / 8;
 653
 654     len = hlens[0] + hlens[1] + hlens[2];
 655     p = *out = av_mallocz(64 + len + len/255);
 656
 657     *p++ = 2;
 658     p += av_xiphlacing(p, hlens[0]);
 659     p += av_xiphlacing(p, hlens[1]);
 660     buffer_len = 0;
 661     for (i = 0; i < 3; i++) {
 662         memcpy(p, buffer + buffer_len, hlens[i]);
 663         p += hlens[i];
 664         buffer_len += hlens[i];
 665     }
 666
 667     return p - *out;
 668 }
 669
 670 static float get_floor_average(floor_t * fc, float * coeffs, int i) {
 671     int begin = fc->list[fc->list[FFMAX(i-1, 0)].sort].x;
 672     int end   = fc->list[fc->list[FFMIN(i+1, fc->values - 1)].sort].x;
 673     int j;
 674     float average = 0;
 675
 676     for (j = begin; j < end; j++)
 677         average += fabs(coeffs[j]);
 678     return average / (end - begin);
 679 }
 680
 681 static void floor_fit(venc_context_t * venc, floor_t * fc, float * coeffs, uint_fast16_t * posts, int samples) {
 682     int range = 255 / fc->multiplier + 1;
 683     int i;
 684     float tot_average = 0.;
 685     float averages[fc->values];
 686     for (i = 0; i < fc->values; i++){
 687         averages[i] = get_floor_average(fc, coeffs, i);
 688         tot_average += averages[i];
 689     }
 690     tot_average /= fc->values;
 691     tot_average /= venc->quality;
 692
 693     for (i = 0; i < fc->values; i++) {
 694         int position = fc->list[fc->list[i].sort].x;
 695         float average = averages[i];
 696         int j;
 697
 698         average *= pow(tot_average / average, 0.5) * pow(1.25, position/200.); // MAGIC!
 699         for (j = 0; j < range - 1; j++)
 700             if (ff_vorbis_floor1_inverse_db_table[j * fc->multiplier] > average) break;
 701         posts[fc->list[i].sort] = j;
 702     }
 703 }
 704
 705 static int render_point(int x0, int y0, int x1, int y1, int x) {
 706     return y0 +  (x - x0) * (y1 - y0) / (x1 - x0);
 707 }
 708
 709 static void floor_encode(venc_context_t * venc, floor_t * fc, PutBitContext * pb, uint_fast16_t * posts, float * floor, int samples) {
 710     int range = 255 / fc->multiplier + 1;
 711     int coded[fc->values]; // first 2 values are unused
 712     int i, counter;
 713
 714     put_bits(pb, 1, 1); // non zero
 715     put_bits(pb, ilog(range - 1), posts[0]);
 716     put_bits(pb, ilog(range - 1), posts[1]);
 717     coded[0] = coded[1] = 1;
 718
 719     for (i = 2; i < fc->values; i++) {
 720         int predicted = render_point(fc->list[fc->list[i].low].x,
 721                                      posts[fc->list[i].low],
 722                                      fc->list[fc->list[i].high].x,
 723                                      posts[fc->list[i].high],
 724                                      fc->list[i].x);
 725         int highroom = range - predicted;
 726         int lowroom = predicted;
 727         int room = FFMIN(highroom, lowroom);
 728         if (predicted == posts[i]) {
 729             coded[i] = 0; // must be used later as flag!
 730             continue;
 731         } else {
 732             if (!coded[fc->list[i].low ]) coded[fc->list[i].low ] = -1;
 733             if (!coded[fc->list[i].high]) coded[fc->list[i].high] = -1;
 734         }
 735         if (posts[i] > predicted) {
 736             if (posts[i] - predicted > room)
 737                 coded[i] = posts[i] - predicted + lowroom;
 738             else
 739                 coded[i] = (posts[i] - predicted) << 1;
 740         } else {
 741             if (predicted - posts[i] > room)
 742                 coded[i] = predicted - posts[i] + highroom - 1;
 743             else
 744                 coded[i] = ((predicted - posts[i]) << 1) - 1;
 745         }
 746     }
 747
 748     counter = 2;
 749     for (i = 0; i < fc->partitions; i++) {
 750         floor_class_t * c = &fc->classes[fc->partition_to_class[i]];
 751         int k, cval = 0, csub = 1<<c->subclass;
 752         if (c->subclass) {
 753             codebook_t * book = &venc->codebooks[c->masterbook];
 754             int cshift = 0;
 755             for (k = 0; k < c->dim; k++) {
 756                 int l;
 757                 for (l = 0; l < csub; l++) {
 758                     int maxval = 1;
 759                     if (c->books[l] != -1)
 760                         maxval = venc->codebooks[c->books[l]].nentries;
 761                     // coded could be -1, but this still works, cause that is 0
 762                     if (coded[counter + k] < maxval) break;
 763                 }
 764                 assert(l != csub);
 765                 cval |= l << cshift;
 766                 cshift += c->subclass;
 767             }
 768             put_codeword(pb, book, cval);
 769         }
 770         for (k = 0; k < c->dim; k++) {
 771             int book = c->books[cval & (csub-1)];
 772             int entry = coded[counter++];
 773             cval >>= c->subclass;
 774             if (book == -1) continue;
 775             if (entry == -1) entry = 0;
 776             put_codeword(pb, &venc->codebooks[book], entry);
 777         }
 778     }
 779
 780     ff_vorbis_floor1_render_list(fc->list, fc->values, posts, coded, fc->multiplier, floor, samples);
 781 }
 782
 783 static float * put_vector(codebook_t * book, PutBitContext * pb, float * num) {
 784     int i, entry = -1;
 785     float distance = FLT_MAX;
 786     assert(book->dimentions);
 787     for (i = 0; i < book->nentries; i++) {
 788         float * vec = book->dimentions + i * book->ndimentions, d = book->pow2[i];
 789         int j;
 790         if (!book->lens[i]) continue;
 791         for (j = 0; j < book->ndimentions; j++)
 792             d -= vec[j] * num[j];
 793         if (distance > d) {
 794             entry = i;
 795             distance = d;
 796         }
 797     }
 798     put_codeword(pb, book, entry);
 799     return &book->dimentions[entry * book->ndimentions];
 800 }
 801
 802 static void residue_encode(venc_context_t * venc, residue_t * rc, PutBitContext * pb, float * coeffs, int samples, int real_ch) {
 803     int pass, i, j, p, k;
 804     int psize = rc->partition_size;
 805     int partitions = (rc->end - rc->begin) / psize;
 806     int channels = (rc->type == 2) ? 1 : real_ch;
 807     int classes[channels][partitions];
 808     int classwords = venc->codebooks[rc->classbook].ndimentions;
 809
 810     assert(rc->type == 2);
 811     assert(real_ch == 2);
 812     for (p = 0; p < partitions; p++) {
 813         float max1 = 0., max2 = 0.;
 814         int s = rc->begin + p * psize;
 815         for (k = s; k < s + psize; k += 2) {
 816             max1 = FFMAX(max1, fabs(coeffs[          k / real_ch]));
 817             max2 = FFMAX(max2, fabs(coeffs[samples + k / real_ch]));
 818         }
 819
 820         for (i = 0; i < rc->classifications - 1; i++) {
 821             if (max1 < rc->maxes[i][0] && max2 < rc->maxes[i][1]) break;
 822         }
 823         classes[0][p] = i;
 824     }
 825
 826     for (pass = 0; pass < 8; pass++) {
 827         p = 0;
 828         while (p < partitions) {
 829             if (pass == 0)
 830                 for (j = 0; j < channels; j++) {
 831                     codebook_t * book = &venc->codebooks[rc->classbook];
 832                     int entry = 0;
 833                     for (i = 0; i < classwords; i++) {
 834                         entry *= rc->classifications;
 835                         entry += classes[j][p + i];
 836                     }
 837                     put_codeword(pb, book, entry);
 838                 }
 839             for (i = 0; i < classwords && p < partitions; i++, p++) {
 840                 for (j = 0; j < channels; j++) {
 841                     int nbook = rc->books[classes[j][p]][pass];
 842                     codebook_t * book = &venc->codebooks[nbook];
 843                     float * buf = coeffs + samples*j + rc->begin + p*psize;
 844                     if (nbook == -1) continue;
 845
 846                     assert(rc->type == 0 || rc->type == 2);
 847                     assert(!(psize % book->ndimentions));
 848
 849                     if (rc->type == 0) {
 850                         for (k = 0; k < psize; k += book->ndimentions) {
 851                             float * a = put_vector(book, pb, &buf[k]);
 852                             int l;
 853                             for (l = 0; l < book->ndimentions; l++)
 854                                 buf[k + l] -= a[l];
 855                         }
 856                     } else {
 857                         int s = rc->begin + p * psize, a1, b1;
 858                         a1 = (s % real_ch) * samples;
 859                         b1 =  s / real_ch;
 860                         s = real_ch * samples;
 861                         for (k = 0; k < psize; k += book->ndimentions) {
 862                             int dim, a2 = a1, b2 = b1;
 863                             float vec[book->ndimentions], * pv = vec;
 864                             for (dim = book->ndimentions; dim--; ) {
 865                                 *pv++ = coeffs[a2 + b2];
 866                                 if ((a2 += samples) == s) {
 867                                     a2=0;
 868                                     b2++;
 869                                 }
 870                             }
 871                             pv = put_vector(book, pb, vec);
 872                             for (dim = book->ndimentions; dim--; ) {
 873                                 coeffs[a1 + b1] -= *pv++;
 874                                 if ((a1 += samples) == s) {
 875                                     a1=0;
 876                                     b1++;
 877                                 }
 878                             }
 879                         }
 880                     }
 881                 }
 882             }
 883         }
 884     }
 885 }
 886
 887 static int apply_window_and_mdct(venc_context_t * venc, signed short * audio, int samples) {
 888     int i, j, channel;
 889     const float * win = venc->win[0];
 890     int window_len = 1 << (venc->log2_blocksize[0] - 1);
 891     float n = (float)(1 << venc->log2_blocksize[0]) / 4.;
 892     // FIXME use dsp
 893
 894     if (!venc->have_saved && !samples) return 0;
 895
 896     if (venc->have_saved) {
 897         for (channel = 0; channel < venc->channels; channel++) {
 898             memcpy(venc->samples + channel*window_len*2, venc->saved + channel*window_len, sizeof(float)*window_len);
 899         }
 900     } else {
 901         for (channel = 0; channel < venc->channels; channel++) {
 902             memset(venc->samples + channel*window_len*2, 0, sizeof(float)*window_len);
 903         }
 904     }
 905
 906     if (samples) {
 907         for (channel = 0; channel < venc->channels; channel++) {
 908             float * offset = venc->samples + channel*window_len*2 + window_len;
 909             j = channel;
 910             for (i = 0; i < samples; i++, j += venc->channels)
 911                 offset[i] = -audio[j] / 32768. / n * win[window_len - i - 1]; //FIXME find out why the sign has to be fliped
 912         }
 913     } else {
 914         for (channel = 0; channel < venc->channels; channel++) {
 915             memset(venc->samples + channel*window_len*2 + window_len, 0, sizeof(float)*window_len);
 916         }
 917     }
 918
 919     for (channel = 0; channel < venc->channels; channel++) {
 920         ff_mdct_calc(&venc->mdct[0], venc->coeffs + channel*window_len, venc->samples + channel*window_len*2);
 921     }
 922
 923     if (samples) {
 924         for (channel = 0; channel < venc->channels; channel++) {
 925             float * offset = venc->saved + channel*window_len;
 926             j = channel;
 927             for (i = 0; i < samples; i++, j += venc->channels)
 928                 offset[i] = -audio[j] / 32768. / n * win[i]; //FIXME find out why the sign has to be fliped
 929         }
 930         venc->have_saved = 1;
 931     } else {
 932         venc->have_saved = 0;
 933     }
 934     return 1;
 935 }
 936
 937 static av_cold int vorbis_encode_init(AVCodecContext * avccontext)
 938 {
 939     venc_context_t * venc = avccontext->priv_data;
 940
 941     if (avccontext->channels != 2) {
 942         av_log(avccontext, AV_LOG_ERROR, "Current FFmpeg Vorbis encoder only supports 2 channels.\n");
 943         return -1;
 944     }
 945
 946     create_vorbis_context(venc, avccontext);
 947
 948     if (avccontext->flags & CODEC_FLAG_QSCALE)
 949         venc->quality = avccontext->global_quality / (float)FF_QP2LAMBDA / 10.;
 950     else
 951         venc->quality = 1.;
 952     venc->quality *= venc->quality;
 953
 954     avccontext->extradata_size = put_main_header(venc, (uint8_t**)&avccontext->extradata);
 955
 956     avccontext->frame_size = 1 << (venc->log2_blocksize[0] - 1);
 957
 958     avccontext->coded_frame = avcodec_alloc_frame();
 959     avccontext->coded_frame->key_frame = 1;
 960
 961     return 0;
 962 }
 963
 964 static int vorbis_encode_frame(AVCodecContext * avccontext, unsigned char * packets, int buf_size, void *data)
 965 {
 966     venc_context_t * venc = avccontext->priv_data;
 967     signed short * audio = data;
 968     int samples = data ? avccontext->frame_size : 0;
 969     vorbis_mode_t * mode;
 970     mapping_t * mapping;
 971     PutBitContext pb;
 972     int i;
 973
 974     if (!apply_window_and_mdct(venc, audio, samples)) return 0;
 975     samples = 1 << (venc->log2_blocksize[0] - 1);
 976
 977     init_put_bits(&pb, packets, buf_size);
 978
 979     put_bits(&pb, 1, 0); // magic bit
 980
 981     put_bits(&pb, ilog(venc->nmodes - 1), 0); // 0 bits, the mode
 982
 983     mode = &venc->modes[0];
 984     mapping = &venc->mappings[mode->mapping];
 985     if (mode->blockflag) {
 986         put_bits(&pb, 1, 0);
 987         put_bits(&pb, 1, 0);
 988     }
 989
 990     for (i = 0; i < venc->channels; i++) {
 991         floor_t * fc = &venc->floors[mapping->floor[mapping->mux[i]]];
 992         uint_fast16_t posts[fc->values];
 993         floor_fit(venc, fc, &venc->coeffs[i * samples], posts, samples);
 994         floor_encode(venc, fc, &pb, posts, &venc->floor[i * samples], samples);
 995     }
 996
 997     for (i = 0; i < venc->channels * samples; i++) {
 998         venc->coeffs[i] /= venc->floor[i];
 999     }
1000
1001     for (i = 0; i < mapping->coupling_steps; i++) {
1002         float * mag = venc->coeffs + mapping->magnitude[i] * samples;
1003         float * ang = venc->coeffs + mapping->angle[i] * samples;
1004         int j;
1005         for (j = 0; j < samples; j++) {
1006             float a = ang[j];
1007             ang[j] -= mag[j];
1008             if (mag[j] > 0) ang[j] = -ang[j];
1009             if (ang[j] < 0) mag[j] = a;
1010         }
1011     }
1012
1013     residue_encode(venc, &venc->residues[mapping->residue[mapping->mux[0]]], &pb, venc->coeffs, samples, venc->channels);
1014
1015     avccontext->coded_frame->pts = venc->sample_count;
1016     venc->sample_count += avccontext->frame_size;
1017     flush_put_bits(&pb);
1018     return (put_bits_count(&pb) + 7) / 8;
1019 }
1020
1021
1022 static av_cold int vorbis_encode_close(AVCodecContext * avccontext)
1023 {
1024     venc_context_t * venc = avccontext->priv_data;
1025     int i;
1026
1027     if (venc->codebooks)
1028         for (i = 0; i < venc->ncodebooks; i++) {
1029             av_freep(&venc->codebooks[i].lens);
1030             av_freep(&venc->codebooks[i].codewords);
1031             av_freep(&venc->codebooks[i].quantlist);
1032             av_freep(&venc->codebooks[i].dimentions);
1033             av_freep(&venc->codebooks[i].pow2);
1034         }
1035     av_freep(&venc->codebooks);
1036
1037     if (venc->floors)
1038         for (i = 0; i < venc->nfloors; i++) {
1039             int j;
1040             if (venc->floors[i].classes)
1041                 for (j = 0; j < venc->floors[i].nclasses; j++)
1042                     av_freep(&venc->floors[i].classes[j].books);
1043             av_freep(&venc->floors[i].classes);
1044             av_freep(&venc->floors[i].partition_to_class);
1045             av_freep(&venc->floors[i].list);
1046         }
1047     av_freep(&venc->floors);
1048
1049     if (venc->residues)
1050         for (i = 0; i < venc->nresidues; i++) {
1051             av_freep(&venc->residues[i].books);
1052             av_freep(&venc->residues[i].maxes);
1053         }
1054     av_freep(&venc->residues);
1055
1056     if (venc->mappings)
1057         for (i = 0; i < venc->nmappings; i++) {
1058             av_freep(&venc->mappings[i].mux);
1059             av_freep(&venc->mappings[i].floor);
1060             av_freep(&venc->mappings[i].residue);
1061             av_freep(&venc->mappings[i].magnitude);
1062             av_freep(&venc->mappings[i].angle);
1063         }
1064     av_freep(&venc->mappings);
1065
1066     av_freep(&venc->modes);
1067
1068     av_freep(&venc->saved);
1069     av_freep(&venc->samples);
1070     av_freep(&venc->floor);
1071     av_freep(&venc->coeffs);
1072
1073     ff_mdct_end(&venc->mdct[0]);
1074     ff_mdct_end(&venc->mdct[1]);
1075
1076     av_freep(&avccontext->coded_frame);
1077     av_freep(&avccontext->extradata);
1078
1079     return 0 ;
1080 }
1081
1082 AVCodec vorbis_encoder = {
1083     "vorbis",
1084     CODEC_TYPE_AUDIO,
1085     CODEC_ID_VORBIS,
1086     sizeof(venc_context_t),
1087     vorbis_encode_init,
1088     vorbis_encode_frame,
1089     vorbis_encode_close,
1090     .capabilities= CODEC_CAP_DELAY,
1091     .sample_fmts = (enum SampleFormat[]){SAMPLE_FMT_S16,SAMPLE_FMT_NONE},
1092     .long_name = NULL_IF_CONFIG_SMALL("Vorbis"),
1093 };