patch-libavcodec_aacenc_is_c 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149
  1. $OpenBSD: patch-libavcodec_aacenc_is_c,v 1.5 2016/01/18 15:34:45 ajacoutot Exp $
  2. aacenc_is: ignore PNS band types
  3. aacenc_is: take absolute coefficient value upon energy calculations
  4. AAC encoder: Extensive improvements
  5. aacenc_is: rename variable
  6. AAC encoder: in IS, fix index of sf_idx, band_type
  7. AAC encoder: fix I/S relative error evaluation
  8. AAC encoder: encode out-of-phase I/S efficiently
  9. avcodec/aacenc_is: replace pow(x, 0.75) by x/sqrtf(sqrtf(x))
  10. AAC encoder: use signed coeffs when measuring IS energy
  11. --- libavcodec/aacenc_is.c.orig Wed Jan 13 15:27:48 2016
  12. +++ libavcodec/aacenc_is.c Sun Jan 17 21:03:19 2016
  13. @@ -45,11 +45,16 @@ struct AACISError ff_aac_is_encoding_err(AACEncContext
  14. float dist1 = 0.0f, dist2 = 0.0f;
  15. struct AACISError is_error = {0};
  16. + if (ener01 <= 0 || ener0 <= 0) {
  17. + is_error.pass = 0;
  18. + return is_error;
  19. + }
  20. +
  21. for (w2 = 0; w2 < sce0->ics.group_len[w]; w2++) {
  22. FFPsyBand *band0 = &s->psy.ch[s->cur_channel+0].psy_bands[(w+w2)*16+g];
  23. FFPsyBand *band1 = &s->psy.ch[s->cur_channel+1].psy_bands[(w+w2)*16+g];
  24. - int is_band_type, is_sf_idx = FFMAX(1, sce0->sf_idx[(w+w2)*16+g]-4);
  25. - float e01_34 = phase*pow(ener1/ener0, 3.0/4.0);
  26. + int is_band_type, is_sf_idx = FFMAX(1, sce0->sf_idx[w*16+g]-4);
  27. + float e01_34 = phase*pos_pow34(ener1/ener0);
  28. float maxval, dist_spec_err = 0.0f;
  29. float minthr = FFMIN(band0->threshold, band1->threshold);
  30. for (i = 0; i < sce0->ics.swb_sizes[g]; i++)
  31. @@ -61,17 +66,17 @@ struct AACISError ff_aac_is_encoding_err(AACEncContext
  32. is_band_type = find_min_book(maxval, is_sf_idx);
  33. dist1 += quantize_band_cost(s, &L[start + (w+w2)*128], L34,
  34. sce0->ics.swb_sizes[g],
  35. - sce0->sf_idx[(w+w2)*16+g],
  36. - sce0->band_type[(w+w2)*16+g],
  37. - s->lambda / band0->threshold, INFINITY, NULL, 0);
  38. + sce0->sf_idx[w*16+g],
  39. + sce0->band_type[w*16+g],
  40. + s->lambda / band0->threshold, INFINITY, NULL, NULL, 0);
  41. dist1 += quantize_band_cost(s, &R[start + (w+w2)*128], R34,
  42. sce1->ics.swb_sizes[g],
  43. - sce1->sf_idx[(w+w2)*16+g],
  44. - sce1->band_type[(w+w2)*16+g],
  45. - s->lambda / band1->threshold, INFINITY, NULL, 0);
  46. + sce1->sf_idx[w*16+g],
  47. + sce1->band_type[w*16+g],
  48. + s->lambda / band1->threshold, INFINITY, NULL, NULL, 0);
  49. dist2 += quantize_band_cost(s, IS, I34, sce0->ics.swb_sizes[g],
  50. is_sf_idx, is_band_type,
  51. - s->lambda / minthr, INFINITY, NULL, 0);
  52. + s->lambda / minthr, INFINITY, NULL, NULL, 0);
  53. for (i = 0; i < sce0->ics.swb_sizes[g]; i++) {
  54. dist_spec_err += (L34[i] - I34[i])*(L34[i] - I34[i]);
  55. dist_spec_err += (R34[i] - I34[i]*e01_34)*(R34[i] - I34[i]*e01_34);
  56. @@ -82,9 +87,10 @@ struct AACISError ff_aac_is_encoding_err(AACEncContext
  57. is_error.pass = dist2 <= dist1;
  58. is_error.phase = phase;
  59. - is_error.error = fabsf(dist1 - dist2);
  60. + is_error.error = dist2 - dist1;
  61. is_error.dist1 = dist1;
  62. is_error.dist2 = dist2;
  63. + is_error.ener01 = ener01;
  64. return is_error;
  65. }
  66. @@ -93,42 +99,58 @@ void ff_aac_search_for_is(AACEncContext *s, AVCodecCon
  67. {
  68. SingleChannelElement *sce0 = &cpe->ch[0];
  69. SingleChannelElement *sce1 = &cpe->ch[1];
  70. - int start = 0, count = 0, w, w2, g, i;
  71. + int start = 0, count = 0, w, w2, g, i, prev_sf1 = -1, prev_bt = -1, prev_is = 0;
  72. const float freq_mult = avctx->sample_rate/(1024.0f/sce0->ics.num_windows)/2.0f;
  73. + uint8_t nextband1[128];
  74. if (!cpe->common_window)
  75. return;
  76. + /** Scout out next nonzero bands */
  77. + ff_init_nextband_map(sce1, nextband1);
  78. +
  79. for (w = 0; w < sce0->ics.num_windows; w += sce0->ics.group_len[w]) {
  80. start = 0;
  81. for (g = 0; g < sce0->ics.num_swb; g++) {
  82. if (start*freq_mult > INT_STEREO_LOW_LIMIT*(s->lambda/170.0f) &&
  83. cpe->ch[0].band_type[w*16+g] != NOISE_BT && !cpe->ch[0].zeroes[w*16+g] &&
  84. - cpe->ch[1].band_type[w*16+g] != NOISE_BT && !cpe->ch[1].zeroes[w*16+g]) {
  85. - float ener0 = 0.0f, ener1 = 0.0f, ener01 = 0.0f;
  86. - struct AACISError ph_err1, ph_err2, *erf;
  87. + cpe->ch[1].band_type[w*16+g] != NOISE_BT && !cpe->ch[1].zeroes[w*16+g] &&
  88. + ff_sfdelta_can_remove_band(sce1, nextband1, prev_sf1, w*16+g)) {
  89. + float ener0 = 0.0f, ener1 = 0.0f, ener01 = 0.0f, ener01p = 0.0f;
  90. + struct AACISError ph_err1, ph_err2, *best;
  91. for (w2 = 0; w2 < sce0->ics.group_len[w]; w2++) {
  92. for (i = 0; i < sce0->ics.swb_sizes[g]; i++) {
  93. - float coef0 = sce0->pcoeffs[start+(w+w2)*128+i];
  94. - float coef1 = sce1->pcoeffs[start+(w+w2)*128+i];
  95. + float coef0 = sce0->coeffs[start+(w+w2)*128+i];
  96. + float coef1 = sce1->coeffs[start+(w+w2)*128+i];
  97. ener0 += coef0*coef0;
  98. ener1 += coef1*coef1;
  99. ener01 += (coef0 + coef1)*(coef0 + coef1);
  100. + ener01p += (coef0 - coef1)*(coef0 - coef1);
  101. }
  102. }
  103. ph_err1 = ff_aac_is_encoding_err(s, cpe, start, w, g,
  104. - ener0, ener1, ener01, 0, -1);
  105. + ener0, ener1, ener01p, 0, -1);
  106. ph_err2 = ff_aac_is_encoding_err(s, cpe, start, w, g,
  107. ener0, ener1, ener01, 0, +1);
  108. - erf = ph_err1.error < ph_err2.error ? &ph_err1 : &ph_err2;
  109. - if (erf->pass) {
  110. + best = (ph_err1.pass && ph_err1.error < ph_err2.error) ? &ph_err1 : &ph_err2;
  111. + if (best->pass) {
  112. cpe->is_mask[w*16+g] = 1;
  113. - cpe->ch[0].is_ener[w*16+g] = sqrt(ener0/ener01);
  114. + cpe->ms_mask[w*16+g] = 0;
  115. + cpe->ch[0].is_ener[w*16+g] = sqrt(ener0 / best->ener01);
  116. cpe->ch[1].is_ener[w*16+g] = ener0/ener1;
  117. - cpe->ch[1].band_type[w*16+g] = erf->phase ? INTENSITY_BT : INTENSITY_BT2;
  118. + cpe->ch[1].band_type[w*16+g] = (best->phase > 0) ? INTENSITY_BT : INTENSITY_BT2;
  119. + if (prev_is && prev_bt != cpe->ch[1].band_type[w*16+g]) {
  120. + /** Flip M/S mask and pick the other CB, since it encodes more efficiently */
  121. + cpe->ms_mask[w*16+g] = 1;
  122. + cpe->ch[1].band_type[w*16+g] = (best->phase > 0) ? INTENSITY_BT2 : INTENSITY_BT;
  123. + }
  124. + prev_bt = cpe->ch[1].band_type[w*16+g];
  125. count++;
  126. }
  127. }
  128. + if (!sce1->zeroes[w*16+g] && sce1->band_type[w*16+g] < RESERVED_BT)
  129. + prev_sf1 = sce1->sf_idx[w*16+g];
  130. + prev_is = cpe->is_mask[w*16+g];
  131. start += sce0->ics.swb_sizes[g];
  132. }
  133. }