/********************************************************************
 *                                                                  *
 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE.   *
 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS     *
 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING.       *
 *                                                                  *
 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2002             *
 * by the XIPHOPHORUS Company http://www.xiph.org/                  *
 *                                                                  *
 ********************************************************************

 function: simple programmatic interface for encoder mode setup
 last mod: $Id: vorbisenc.c,v 1.36 2002/01/22 08:06:07 xiphmont Exp $

 ********************************************************************/
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include <stdarg.h>

#include "vorbis/codec.h"
#include "vorbis/vorbisenc.h"

#include "codec_internal.h"
#include "registry-api.h"
#include "os.h"
#include "misc.h"
  25. /* careful with this; it's using static array sizing to make managing
  26. all the modes a little less annoying. If we use a residue backend
  27. with > 10 partition types, or a different division of iteration,
  28. this needs to be updated. */
  29. typedef struct {
  30. vorbis_info_residue0 *res[2];
  31. static_codebook *book_aux[2];
  32. static_codebook *books_base[5][10][3];
  33. static_codebook *books_stereo_backfill[5][10];
  34. static_codebook *books_residue_backfill[5][10][2];
  35. } vorbis_residue_template;
  36. static double stereo_threshholds[]={0.0, 2.5, 4.5, 8.5, 16.5};
  37. typedef struct vp_adjblock{
  38. int block[P_BANDS][P_LEVELS];
  39. } vp_adjblock;
  40. #include "modes/residue_44.h"
  41. #include "modes/psych_44.h"
  42. #include "modes/floor_44.h"
  43. /* a few static coder conventions */
  44. static vorbis_info_time0 _time_dummy={0};
  45. static vorbis_info_mode _mode_set_short={0,0,0,0};
  46. static vorbis_info_mode _mode_set_long={1,0,0,1};
  47. /* mapping conventions:
  48. only one submap (this would change for efficient 5.1 support for example)*/
  49. /* Four psychoacoustic profiles are used, one for each blocktype */
  50. static vorbis_info_mapping0 _mapping_set_short={
  51. 1, {0,0}, {0}, {0}, {0}, {0,1}, 0,{0},{0}};
  52. static vorbis_info_mapping0 _mapping_set_long={
  53. 1, {0,0}, {0}, {1}, {1}, {2,3}, 0,{0},{0}};
  54. static int vorbis_encode_toplevel_setup(vorbis_info *vi,int small,int large,int ch,long rate){
  55. if(vi && vi->codec_setup){
  56. codec_setup_info *ci=vi->codec_setup;
  57. vi->version=0;
  58. vi->channels=ch;
  59. vi->rate=rate;
  60. ci->blocksizes[0]=small;
  61. ci->blocksizes[1]=large;
  62. /* time mapping hooks are unused in vorbis I */
  63. ci->times=1;
  64. ci->time_type[0]=0;
  65. ci->time_param[0]=_ogg_calloc(1,sizeof(_time_dummy));
  66. memcpy(ci->time_param[0],&_time_dummy,sizeof(_time_dummy));
  67. /* by convention, two modes: one for short, one for long blocks.
  68. short block mode uses mapping sero, long block uses mapping 1 */
  69. ci->modes=2;
  70. ci->mode_param[0]=_ogg_calloc(1,sizeof(_mode_set_short));
  71. memcpy(ci->mode_param[0],&_mode_set_short,sizeof(_mode_set_short));
  72. ci->mode_param[1]=_ogg_calloc(1,sizeof(_mode_set_long));
  73. memcpy(ci->mode_param[1],&_mode_set_long,sizeof(_mode_set_long));
  74. /* by convention two mappings, both mapping type zero (polyphonic
  75. PCM), first for short, second for long blocks */
  76. ci->maps=2;
  77. ci->map_type[0]=0;
  78. ci->map_param[0]=_ogg_calloc(1,sizeof(_mapping_set_short));
  79. memcpy(ci->map_param[0],&_mapping_set_short,sizeof(_mapping_set_short));
  80. ci->map_type[1]=0;
  81. ci->map_param[1]=_ogg_calloc(1,sizeof(_mapping_set_long));
  82. memcpy(ci->map_param[1],&_mapping_set_long,sizeof(_mapping_set_long));
  83. return(0);
  84. }
  85. return(OV_EINVAL);
  86. }
  87. static int vorbis_encode_floor_setup(vorbis_info *vi,double q,int block,
  88. static_codebook ***books,
  89. vorbis_info_floor1 *in,
  90. ...){
  91. int x[11],i,k,iq=rint(q*10);
  92. vorbis_info_floor1 *f=_ogg_calloc(1,sizeof(*f));
  93. codec_setup_info *ci=vi->codec_setup;
  94. va_list ap;
  95. va_start(ap,in);
  96. for(i=0;i<11;i++)
  97. x[i]=va_arg(ap,int);
  98. va_end(ap);
  99. memcpy(f,in+x[iq],sizeof(*f));
  100. /* fill in the lowpass field, even if it's temporary */
  101. f->n=ci->blocksizes[block]>>1;
  102. /* books */
  103. {
  104. int partitions=f->partitions;
  105. int maxclass=-1;
  106. int maxbook=-1;
  107. for(i=0;i<partitions;i++)
  108. if(f->partitionclass[i]>maxclass)maxclass=f->partitionclass[i];
  109. for(i=0;i<=maxclass;i++){
  110. if(f->class_book[i]>maxbook)maxbook=f->class_book[i];
  111. f->class_book[i]+=ci->books;
  112. for(k=0;k<(1<<f->class_subs[i]);k++){
  113. if(f->class_subbook[i][k]>maxbook)maxbook=f->class_subbook[i][k];
  114. if(f->class_subbook[i][k]>=0)f->class_subbook[i][k]+=ci->books;
  115. }
  116. }
  117. for(i=0;i<=maxbook;i++)
  118. ci->book_param[ci->books++]=books[x[iq]][i];
  119. }
  120. /* for now, we're only using floor 1 */
  121. ci->floor_type[ci->floors]=1;
  122. ci->floor_param[ci->floors]=f;
  123. ci->floors++;
  124. return(0);
  125. }
  126. static int vorbis_encode_global_psych_setup(vorbis_info *vi,double q,
  127. vorbis_info_psy_global *in, ...){
  128. int i,iq=q*10;
  129. double x[11],dq;
  130. codec_setup_info *ci=vi->codec_setup;
  131. vorbis_info_psy_global *g=&ci->psy_g_param;
  132. va_list ap;
  133. va_start(ap,in);
  134. for(i=0;i<11;i++)
  135. x[i]=va_arg(ap,double);
  136. va_end(ap);
  137. if(iq==10){
  138. iq=9;
  139. dq=1.;
  140. }else{
  141. dq=q*10.-iq;
  142. }
  143. memcpy(g,in+(int)x[iq],sizeof(*g));
  144. dq=x[iq]*(1.-dq)+x[iq+1]*dq;
  145. iq=(int)dq;
  146. dq-=iq;
  147. if(dq==0 && iq>0){
  148. iq--;
  149. dq=1.;
  150. }
  151. /* interpolate the trigger threshholds */
  152. for(i=0;i<4;i++){
  153. g->preecho_thresh[i]=in[iq].preecho_thresh[i]*(1.-dq)+in[iq+1].preecho_thresh[i]*dq;
  154. g->postecho_thresh[i]=in[iq].postecho_thresh[i]*(1.-dq)+in[iq+1].postecho_thresh[i]*dq;
  155. }
  156. g->ampmax_att_per_sec=ci->hi.amplitude_track_dBpersec;
  157. return(0);
  158. }
  159. static int vorbis_encode_psyset_setup(vorbis_info *vi,int block){
  160. codec_setup_info *ci=vi->codec_setup;
  161. vorbis_info_psy *p=ci->psy_param[block];
  162. if(block>=ci->psys)
  163. ci->psys=block+1;
  164. if(!p){
  165. p=_ogg_calloc(1,sizeof(*p));
  166. ci->psy_param[block]=p;
  167. }
  168. memcpy(p,&_psy_info_template,sizeof(*p));
  169. return 0;
  170. }
  171. static int vorbis_encode_tonemask_setup(vorbis_info *vi,double q,int block,
  172. double *att,
  173. double *max,
  174. int *peaklimit_bands,
  175. vp_adjblock *in){
  176. int i,j,iq;
  177. double dq;
  178. codec_setup_info *ci=vi->codec_setup;
  179. vorbis_info_psy *p=ci->psy_param[block];
  180. iq=q*10;
  181. if(iq==10){
  182. iq=9;
  183. dq=1.;
  184. }else{
  185. dq=q*10.-iq;
  186. }
  187. p->tone_masteratt=att[iq]*(1.-dq)+att[iq+1]*dq;
  188. p->max_curve_dB=max[iq]*(1.-dq)+max[iq+1]*dq;
  189. p->curvelimitp=peaklimit_bands[iq];
  190. iq=q*5.;
  191. if(iq==5){
  192. iq=5;
  193. dq=1.;
  194. }else{
  195. dq=q*5.-iq;
  196. }
  197. for(i=0;i<P_BANDS;i++)
  198. for(j=0;j<P_LEVELS;j++)
  199. p->toneatt.block[i][j]=(j<4?4:j)*-10.+
  200. in[iq].block[i][j]*(1.-dq)+in[iq+1].block[i][j]*dq;
  201. return(0);
  202. }
  203. static int vorbis_encode_compand_setup(vorbis_info *vi,double q,int block,
  204. float in[][NOISE_COMPAND_LEVELS], ...){
  205. int i,iq=q*10;
  206. double x[11],dq;
  207. codec_setup_info *ci=vi->codec_setup;
  208. vorbis_info_psy *p=ci->psy_param[block];
  209. va_list ap;
  210. va_start(ap,in);
  211. for(i=0;i<11;i++)
  212. x[i]=va_arg(ap,double);
  213. va_end(ap);
  214. if(iq==10){
  215. iq=9;
  216. dq=1.;
  217. }else{
  218. dq=q*10.-iq;
  219. }
  220. dq=x[iq]*(1.-dq)+x[iq+1]*dq;
  221. iq=(int)dq;
  222. dq-=iq;
  223. if(dq==0 && iq>0){
  224. iq--;
  225. dq=1.;
  226. }
  227. /* interpolate the compander settings */
  228. for(i=0;i<NOISE_COMPAND_LEVELS;i++)
  229. p->noisecompand[i]=in[iq][i]*(1.-dq)+in[iq+1][i]*dq;
  230. return(0);
  231. }
  232. static int vorbis_encode_peak_setup(vorbis_info *vi,double q,int block,
  233. double *guard,
  234. double *suppress,
  235. vp_adjblock *in){
  236. int i,j,iq;
  237. double dq;
  238. codec_setup_info *ci=vi->codec_setup;
  239. vorbis_info_psy *p=ci->psy_param[block];
  240. iq=q*10;
  241. if(iq==10){
  242. iq=9;
  243. dq=1.;
  244. }else{
  245. dq=q*10.-iq;
  246. }
  247. p->peakattp=1;
  248. p->tone_guard=guard[iq]*(1.-dq)+guard[iq+1]*dq;
  249. p->tone_abs_limit=suppress[iq]*(1.-dq)+suppress[iq+1]*dq;
  250. iq=q*5.;
  251. if(iq==5){
  252. iq=5;
  253. dq=1.;
  254. }else{
  255. dq=q*5.-iq;
  256. }
  257. for(i=0;i<P_BANDS;i++)
  258. for(j=0;j<P_LEVELS;j++)
  259. p->peakatt.block[i][j]=(j<4?4:j)*-10.+
  260. in[iq].block[i][j]*(1.-dq)+in[iq+1].block[i][j]*dq;
  261. return(0);
  262. }
  263. static int vorbis_encode_noisebias_setup(vorbis_info *vi,double q,int block,
  264. double *suppress,
  265. int in[][17],int guard[33]){
  266. int i,iq=q*10;
  267. double dq;
  268. codec_setup_info *ci=vi->codec_setup;
  269. vorbis_info_psy *p=ci->psy_param[block];
  270. if(iq==10){
  271. iq=9;
  272. dq=1.;
  273. }else{
  274. dq=q*10.-iq;
  275. }
  276. p->noisemaxsupp=suppress[iq]*(1.-dq)+suppress[iq+1]*dq;
  277. p->noisewindowlomin=guard[iq*3];
  278. p->noisewindowhimin=guard[iq*3+1];
  279. p->noisewindowfixed=guard[iq*3+2];
  280. for(i=0;i<P_BANDS;i++)
  281. p->noiseoff[i]=in[iq][i]*(1.-dq)+in[iq+1][i]*dq;
  282. return(0);
  283. }
  284. static int vorbis_encode_ath_setup(vorbis_info *vi,double q,int block,
  285. float in[][27], ...){
  286. int i,iq=q*10;
  287. double x[11],dq;
  288. codec_setup_info *ci=vi->codec_setup;
  289. vorbis_info_psy *p=ci->psy_param[block];
  290. va_list ap;
  291. va_start(ap,in);
  292. for(i=0;i<11;i++)
  293. x[i]=va_arg(ap,double);
  294. va_end(ap);
  295. p->ath_adjatt=ci->hi.ath_floating_dB;
  296. p->ath_maxatt=ci->hi.ath_absolute_dB;
  297. if(iq==10){
  298. iq=9;
  299. dq=1.;
  300. }else{
  301. dq=q*10.-iq;
  302. }
  303. dq=x[iq]*(1.-dq)+x[iq+1]*dq;
  304. iq=(int)dq;
  305. dq-=iq;
  306. if(dq==0 && iq>0){
  307. iq--;
  308. dq=1.;
  309. }
  310. for(i=0;i<27;i++)
  311. p->ath[i]=in[iq][i]*(1.-dq)+in[iq+1][i]*dq;
  312. return(0);
  313. }
  314. static int book_dup_or_new(codec_setup_info *ci,static_codebook *book){
  315. int i;
  316. for(i=0;i<ci->books;i++)
  317. if(ci->book_param[i]==book)return(i);
  318. return(ci->books++);
  319. }
  320. static int vorbis_encode_residue_setup(vorbis_info *vi,double q,int block,
  321. int coupled_p,
  322. int stereo_backfill_p,
  323. int residue_backfill_p,
  324. vorbis_residue_template *in,
  325. int point_dB,
  326. double point_kHz){
  327. int i,iq=q*10;
  328. int n,k;
  329. int partition_position=0;
  330. int res_position=0;
  331. int iterations=1;
  332. int amplitude_select=0;
  333. codec_setup_info *ci=vi->codec_setup;
  334. vorbis_info_residue0 *r;
  335. vorbis_info_psy *psy=ci->psy_param[block*2];
  336. /* may be re-called due to ctl */
  337. if(ci->residue_param[block])
  338. /* free preexisting instance */
  339. residue_free_info(ci->residue_param[block],ci->residue_type[block]);
  340. r=ci->residue_param[block]=_ogg_malloc(sizeof(*r));
  341. memcpy(r,in[iq].res[block],sizeof(*r));
  342. if(ci->residues<=block)ci->residues=block+1;
  343. if(block){
  344. r->grouping=32;
  345. }else{
  346. r->grouping=16;
  347. }
  348. /* for uncoupled, we use type 1, else type 2 */
  349. if(coupled_p){
  350. ci->residue_type[block]=2;
  351. }else{
  352. ci->residue_type[block]=1;
  353. }
  354. switch(ci->residue_type[block]){
  355. case 1:
  356. n=r->end=ci->blocksizes[block?1:0]>>1; /* to be adjusted by lowpass later */
  357. partition_position=rint(point_kHz*1000./(vi->rate/2)*n/r->grouping);
  358. res_position=partition_position*r->grouping;
  359. break;
  360. case 2:
  361. n=r->end=(ci->blocksizes[block?1:0]>>1)*vi->channels; /* to be adjusted by lowpass later */
  362. partition_position=rint(point_kHz*1000./(vi->rate/2)*n/r->grouping);
  363. res_position=partition_position*r->grouping/vi->channels;
  364. break;
  365. }
  366. for(i=0;i<r->partitions;i++)
  367. if(r->blimit[i]<0)r->blimit[i]=partition_position;
  368. for(i=0;i<r->partitions;i++)
  369. for(k=0;k<3;k++)
  370. if(in[iq].books_base[point_dB][i][k])
  371. r->secondstages[i]|=(1<<k);
  372. ci->passlimit[0]=3;
  373. if(coupled_p){
  374. vorbis_info_mapping0 *map=ci->map_param[block];
  375. map->coupling_steps=1;
  376. map->coupling_mag[0]=0;
  377. map->coupling_ang[0]=1;
  378. psy->couple_pass[0].granulem=1.;
  379. psy->couple_pass[0].igranulem=1.;
  380. psy->couple_pass[0].couple_pass[0].limit=res_position;
  381. psy->couple_pass[0].couple_pass[0].outofphase_redundant_flip_p=1;
  382. psy->couple_pass[0].couple_pass[0].outofphase_requant_limit=9e10;
  383. psy->couple_pass[0].couple_pass[0].amppost_point=0;
  384. psy->couple_pass[0].couple_pass[1].limit=9999;
  385. psy->couple_pass[0].couple_pass[1].outofphase_redundant_flip_p=1;
  386. psy->couple_pass[0].couple_pass[1].outofphase_requant_limit=9e10;
  387. psy->couple_pass[0].couple_pass[1].amppost_point=
  388. stereo_threshholds[point_dB];
  389. amplitude_select=point_dB;
  390. if(stereo_backfill_p && amplitude_select){
  391. memcpy(psy->couple_pass+iterations,psy->couple_pass+iterations-1,
  392. sizeof(*psy->couple_pass));
  393. psy->couple_pass[1].couple_pass[1].amppost_point=stereo_threshholds[amplitude_select-1];
  394. ci->passlimit[1]=4;
  395. for(i=0;i<r->partitions;i++)
  396. if(in[iq].books_stereo_backfill[amplitude_select][i])
  397. r->secondstages[i]|=8;
  398. amplitude_select=amplitude_select-1;
  399. iterations++;
  400. }
  401. if(residue_backfill_p){
  402. memcpy(psy->couple_pass+iterations,psy->couple_pass+iterations-1,
  403. sizeof(*psy->couple_pass));
  404. psy->couple_pass[iterations].granulem=.333333333;
  405. psy->couple_pass[iterations].igranulem=3.;
  406. psy->couple_pass[iterations].couple_pass[0].outofphase_requant_limit=1.;
  407. psy->couple_pass[iterations].couple_pass[1].outofphase_requant_limit=1.;
  408. for(i=0;i<r->partitions;i++)
  409. if(in[iq].books_residue_backfill[amplitude_select][i][0])
  410. r->secondstages[i]|=(1<<(iterations+2));
  411. ci->passlimit[iterations]=ci->passlimit[iterations-1]+1;
  412. iterations++;
  413. memcpy(psy->couple_pass+iterations,psy->couple_pass+iterations-1,
  414. sizeof(*psy->couple_pass));
  415. psy->couple_pass[iterations].granulem=.1111111111;
  416. psy->couple_pass[iterations].igranulem=9.;
  417. psy->couple_pass[iterations].couple_pass[0].outofphase_requant_limit=.3;
  418. psy->couple_pass[iterations].couple_pass[1].outofphase_requant_limit=.3;
  419. for(i=0;i<r->partitions;i++)
  420. if(in[iq].books_residue_backfill[amplitude_select][i][1])
  421. r->secondstages[i]|=(1<<(iterations+2));
  422. ci->passlimit[iterations]=ci->passlimit[iterations-1]+1;
  423. iterations++;
  424. }
  425. ci->coupling_passes=iterations;
  426. }else{
  427. if(residue_backfill_p){
  428. for(i=0;i<r->partitions;i++){
  429. if(in[iq].books_residue_backfill[0][i][0])
  430. r->secondstages[i]|=8;
  431. if(in[iq].books_residue_backfill[0][i][1])
  432. r->secondstages[i]|=16;
  433. }
  434. ci->passlimit[1]=4;
  435. ci->passlimit[2]=5;
  436. ci->coupling_passes=3;
  437. }else
  438. ci->coupling_passes=1;
  439. }
  440. memcpy(&ci->psy_param[block*2+1]->couple_pass,
  441. &ci->psy_param[block*2]->couple_pass,
  442. sizeof(psy->couple_pass));
  443. /* fill in all the books */
  444. {
  445. int booklist=0,k;
  446. r->groupbook=ci->books;
  447. ci->book_param[ci->books++]=in[iq].book_aux[block];
  448. for(i=0;i<r->partitions;i++){
  449. for(k=0;k<3;k++){
  450. if(in[iq].books_base[point_dB][i][k]){
  451. int bookid=book_dup_or_new(ci,in[iq].books_base[point_dB][i][k]);
  452. r->booklist[booklist++]=bookid;
  453. ci->book_param[bookid]=in[iq].books_base[point_dB][i][k];
  454. }
  455. }
  456. if(coupled_p && stereo_backfill_p && point_dB &&
  457. in[iq].books_stereo_backfill[point_dB][i]){
  458. int bookid=book_dup_or_new(ci,in[iq].books_stereo_backfill[point_dB][i]);
  459. r->booklist[booklist++]=bookid;
  460. ci->book_param[bookid]=in[iq].books_stereo_backfill[point_dB][i];
  461. }
  462. if(residue_backfill_p){
  463. for(k=0;k<2;k++){
  464. if(in[iq].books_residue_backfill[amplitude_select][i][k]){
  465. int bookid=book_dup_or_new(ci,in[iq].books_residue_backfill[amplitude_select][i][k]);
  466. r->booklist[booklist++]=bookid;
  467. ci->book_param[bookid]=in[iq].books_residue_backfill[amplitude_select][i][k];
  468. }
  469. }
  470. }
  471. }
  472. }
  473. return(0);
  474. }
  475. static int vorbis_encode_lowpass_setup(vorbis_info *vi,double q,int block){
  476. int iq=q*10;
  477. double dq;
  478. double freq;
  479. codec_setup_info *ci=vi->codec_setup;
  480. vorbis_info_floor1 *f=ci->floor_param[block];
  481. vorbis_info_residue0 *r=ci->residue_param[block];
  482. int blocksize=ci->blocksizes[block]>>1;
  483. double nyq=vi->rate/2.;
  484. if(iq==10){
  485. iq=9;
  486. dq=1.;
  487. }else{
  488. dq=q*10.-iq;
  489. }
  490. freq=ci->hi.lowpass_kHz[block]*1000.;
  491. if(freq>vi->rate/2)freq=vi->rate/2;
  492. /* lowpass needs to be set in the floor and the residue. */
  493. /* in the floor, the granularity can be very fine; it doesn't alter
  494. the encoding structure, only the samples used to fit the floor
  495. approximation */
  496. f->n=freq/nyq*blocksize;
  497. /* in the residue, we're constrained, physically, by partition
  498. boundaries. We still lowpass 'wherever', but we have to round up
  499. here to next boundary, or the vorbis spec will round it *down* to
  500. previous boundary in encode/decode */
  501. if(ci->residue_type[block]==2)
  502. r->end=(int)((freq/nyq*blocksize*2)/r->grouping+.9)* /* round up only if we're well past */
  503. r->grouping;
  504. else
  505. r->end=(int)((freq/nyq*blocksize)/r->grouping+.9)* /* round up only if we're well past */
  506. r->grouping;
  507. return(0);
  508. }
  509. /* encoders will need to use vorbis_info_init beforehand and call
  510. vorbis_info clear when all done */
  511. /* two interfaces; this, more detailed one, and later a convenience
  512. layer on top */
  513. /* the final setup call */
  514. int vorbis_encode_setup_init(vorbis_info *vi){
  515. int ret=0;
  516. /*long rate=vi->rate;*/
  517. long channels=vi->channels;
  518. codec_setup_info *ci=vi->codec_setup;
  519. highlevel_encode_setup *hi=&ci->hi;
  520. ret|=vorbis_encode_floor_setup(vi,hi->base_quality_short,0,
  521. _floor_44_128_books,_floor_44_128,
  522. 0,1,1,2,2,2,2,2,2,2,2);
  523. ret|=vorbis_encode_floor_setup(vi,hi->base_quality_long,1,
  524. _floor_44_1024_books,_floor_44_1024,
  525. 0,0,0,0,0,0,0,0,0,0,0);
  526. ret|=vorbis_encode_global_psych_setup(vi,hi->trigger_quality,_psy_global_44,
  527. 0., 1., 1.5, 2., 2., 2., 2., 2., 2., 2., 2.);
  528. ret|=vorbis_encode_psyset_setup(vi,0);
  529. ret|=vorbis_encode_psyset_setup(vi,1);
  530. ret|=vorbis_encode_psyset_setup(vi,2);
  531. ret|=vorbis_encode_psyset_setup(vi,3);
  532. ret|=vorbis_encode_tonemask_setup(vi,hi->blocktype[0].tone_mask_quality,0,
  533. _psy_tone_masteratt,_psy_tone_0dB,_psy_ehmer_bandlimit,
  534. _vp_tonemask_adj_otherblock);
  535. ret|=vorbis_encode_tonemask_setup(vi,hi->blocktype[1].tone_mask_quality,1,
  536. _psy_tone_masteratt,_psy_tone_0dB,_psy_ehmer_bandlimit,
  537. _vp_tonemask_adj_otherblock);
  538. ret|=vorbis_encode_tonemask_setup(vi,hi->blocktype[2].tone_mask_quality,2,
  539. _psy_tone_masteratt,_psy_tone_0dB,_psy_ehmer_bandlimit,
  540. _vp_tonemask_adj_otherblock);
  541. ret|=vorbis_encode_tonemask_setup(vi,hi->blocktype[3].tone_mask_quality,3,
  542. _psy_tone_masteratt,_psy_tone_0dB,_psy_ehmer_bandlimit,
  543. _vp_tonemask_adj_longblock);
  544. ret|=vorbis_encode_compand_setup(vi,hi->blocktype[0].noise_compand_quality,
  545. 0,_psy_compand_44_short,
  546. 1., 1., 1.3, 1.6, 2., 2., 2., 2., 2., 2., 2.);
  547. ret|=vorbis_encode_compand_setup(vi,hi->blocktype[1].noise_compand_quality,
  548. 1,_psy_compand_44_short,
  549. 1., 1., 1.3, 1.6, 2., 2., 2., 2., 2., 2., 2.);
  550. ret|=vorbis_encode_compand_setup(vi,hi->blocktype[2].noise_compand_quality,
  551. 2,_psy_compand_44,
  552. 1., 1., 1.3, 1.6, 2., 2., 2., 2., 2., 2., 2.);
  553. ret|=vorbis_encode_compand_setup(vi,hi->blocktype[3].noise_compand_quality,
  554. 3,_psy_compand_44,
  555. 1., 1., 1.3, 1.6, 2., 2., 2., 2., 2., 2., 2.);
  556. ret|=vorbis_encode_peak_setup(vi,hi->blocktype[0].tone_peaklimit_quality,
  557. 0,_psy_tone_masterguard,_psy_tone_suppress,
  558. _vp_peakguard);
  559. ret|=vorbis_encode_peak_setup(vi,hi->blocktype[1].tone_peaklimit_quality,
  560. 1,_psy_tone_masterguard,_psy_tone_suppress,
  561. _vp_peakguard);
  562. ret|=vorbis_encode_peak_setup(vi,hi->blocktype[2].tone_peaklimit_quality,
  563. 2,_psy_tone_masterguard,_psy_tone_suppress,
  564. _vp_peakguard);
  565. ret|=vorbis_encode_peak_setup(vi,hi->blocktype[3].tone_peaklimit_quality,
  566. 3,_psy_tone_masterguard,_psy_tone_suppress,
  567. _vp_peakguard);
  568. if(hi->impulse_block_p){
  569. ret|=vorbis_encode_noisebias_setup(vi,hi->blocktype[0].noise_bias_quality,
  570. 0,_psy_noise_suppress,_psy_noisebias_impulse,
  571. _psy_noiseguards_short);
  572. }else{
  573. ret|=vorbis_encode_noisebias_setup(vi,hi->blocktype[0].noise_bias_quality,
  574. 0,_psy_noise_suppress,_psy_noisebias_other,
  575. _psy_noiseguards_short);
  576. }
  577. ret|=vorbis_encode_noisebias_setup(vi,hi->blocktype[1].noise_bias_quality,
  578. 1,_psy_noise_suppress,_psy_noisebias_other,
  579. _psy_noiseguards_short);
  580. ret|=vorbis_encode_noisebias_setup(vi,hi->blocktype[2].noise_bias_quality,
  581. 2,_psy_noise_suppress,_psy_noisebias_other,
  582. _psy_noiseguards_long);
  583. ret|=vorbis_encode_noisebias_setup(vi,hi->blocktype[3].noise_bias_quality,
  584. 3,_psy_noise_suppress,_psy_noisebias_long,
  585. _psy_noiseguards_long);
  586. ret|=vorbis_encode_ath_setup(vi,hi->blocktype[0].ath_quality,0,ATH_Bark_dB,
  587. 0., 0., 0., 0., .2, .5, 1., 1., 1.5, 2., 2.);
  588. ret|=vorbis_encode_ath_setup(vi,hi->blocktype[1].ath_quality,1,ATH_Bark_dB,
  589. 0., 0., 0., 0., .2, .5, 1., 1., 1.5, 2., 2.);
  590. ret|=vorbis_encode_ath_setup(vi,hi->blocktype[2].ath_quality,2,ATH_Bark_dB,
  591. 0., 0., 0., 0., .2, .5, 1., 1., 1.5, 2., 2.);
  592. ret|=vorbis_encode_ath_setup(vi,hi->blocktype[3].ath_quality,3,ATH_Bark_dB,
  593. 0., 0., 0., 0., .2, .5, 1., 1., 1.5, 2., 2.);
  594. if(ret){
  595. vorbis_info_clear(vi);
  596. return ret;
  597. }
  598. if(channels==2 && hi->stereo_couple_p){
  599. /* setup specific to stereo coupling */
  600. ret|=vorbis_encode_residue_setup(vi,hi->base_quality_short,0,
  601. 1, /* coupled */
  602. hi->stereo_backfill_p,
  603. hi->residue_backfill_p,
  604. _residue_template_44_stereo,
  605. hi->stereo_point_dB,
  606. hi->stereo_point_kHz[0]);
  607. ret|=vorbis_encode_residue_setup(vi,hi->base_quality_long,1,
  608. 1, /* coupled */
  609. hi->stereo_backfill_p,
  610. hi->residue_backfill_p,
  611. _residue_template_44_stereo,
  612. hi->stereo_point_dB,
  613. hi->stereo_point_kHz[1]);
  614. }else{
  615. /* setup specific to non-stereo (mono or uncoupled polyphonic)
  616. coupling */
  617. ret|=vorbis_encode_residue_setup(vi,hi->base_quality_short,0,
  618. 0, /* uncoupled */
  619. 0,
  620. hi->residue_backfill_p,
  621. _residue_template_44_uncoupled,
  622. 0,
  623. hi->stereo_point_kHz[0]); /* just
  624. used as an encoding partitioning
  625. point */
  626. ret|=vorbis_encode_residue_setup(vi,hi->base_quality_long,1,
  627. 0, /* uncoupled */
  628. 0,
  629. hi->residue_backfill_p,
  630. _residue_template_44_uncoupled,
  631. 0,
  632. hi->stereo_point_kHz[1]); /* just
  633. used as an encoding partitioning
  634. point */
  635. }
  636. ret|=vorbis_encode_lowpass_setup(vi,hi->lowpass_kHz[0],0);
  637. ret|=vorbis_encode_lowpass_setup(vi,hi->lowpass_kHz[1],1);
  638. if(ret)
  639. vorbis_info_clear(vi);
  640. return(ret);
  641. }
  642. /* this is only tuned for 44.1kHz right now. S'ok, for other rates it
  643. just doesn't guess */
  644. static double ratepch_un44[11]=
  645. {40000.,50000.,60000.,70000.,75000.,85000.,105000.,
  646. 115000.,135000.,160000.,250000.};
  647. static double ratepch_st44[11]=
  648. {32000.,40000.,48000.,56000.,64000.,
  649. 80000.,96000.,112000.,128000.,160000.,250000.};
  650. static double vbr_to_approx_bitrate(int ch,int coupled,
  651. double q,long srate){
  652. int iq=q*10.;
  653. double dq;
  654. double *r=NULL;
  655. if(iq==10){
  656. iq=9;
  657. dq=1.;
  658. }else{
  659. dq=q*10.-iq;
  660. }
  661. if(srate>42000 && srate<46000){
  662. if(coupled)
  663. r=ratepch_st44;
  664. else
  665. r=ratepch_un44;
  666. }
  667. if(r==NULL)
  668. return(-1);
  669. return((r[iq]*(1.-dq)+r[iq+1]*dq)*ch);
  670. }
  671. static double approx_bitrate_to_vbr(int ch,int coupled,
  672. double bitrate,long srate){
  673. double *r=NULL,del;
  674. int i;
  675. if(srate>42000 && srate<46000){
  676. if(coupled)
  677. r=ratepch_st44;
  678. else
  679. r=ratepch_un44;
  680. }
  681. if(r==NULL)
  682. return(-1.);
  683. bitrate/=ch;
  684. if(bitrate<=r[0])return(0.);
  685. for(i=0;i<10;i++)
  686. if(r[i]<bitrate && r[i+1]>=bitrate)break;
  687. if(i==10)return(10.);
  688. del=(bitrate-r[i])/(r[i+1]-r[i]);
  689. return((i+del)*.1);
  690. }
  691. /* only populates the high-level settings so that we can tweak with ctl before final setup */
  692. int vorbis_encode_setup_vbr(vorbis_info *vi,
  693. long channels,
  694. long rate,
  695. float base_quality){
  696. int ret=0,i,iq;
  697. double dq;
  698. codec_setup_info *ci=vi->codec_setup;
  699. highlevel_encode_setup *hi=&ci->hi;
  700. base_quality+=.0001;
  701. if(base_quality<0.)base_quality=0.;
  702. if(base_quality>.999)base_quality=.999;
  703. iq=base_quality*10;
  704. if(iq==10){
  705. iq=9;
  706. dq=1.;
  707. }else{
  708. dq=base_quality*10.-iq;
  709. }
  710. ret|=vorbis_encode_toplevel_setup(vi,256,2048,channels,rate);
  711. hi->base_quality=base_quality;
  712. hi->base_quality_short=base_quality;
  713. hi->base_quality_long=base_quality;
  714. hi->trigger_quality=base_quality;
  715. for(i=0;i<4;i++){
  716. hi->blocktype[i].tone_mask_quality=base_quality;
  717. hi->blocktype[i].tone_peaklimit_quality=base_quality;
  718. hi->blocktype[i].noise_bias_quality=base_quality;
  719. hi->blocktype[i].noise_compand_quality=base_quality;
  720. hi->blocktype[i].ath_quality=base_quality;
  721. }
  722. hi->short_block_p=1;
  723. hi->long_block_p=1;
  724. hi->impulse_block_p=1;
  725. hi->amplitude_track_dBpersec=-6.;
  726. hi->stereo_couple_p=1; /* only relevant if a two channel input */
  727. hi->stereo_backfill_p=0;
  728. hi->residue_backfill_p=0;
  729. /* set the ATH floaters */
  730. hi->ath_floating_dB=_psy_ath_floater[iq]*(1.-dq)+_psy_ath_floater[iq+1]*dq;
  731. hi->ath_absolute_dB=_psy_ath_abs[iq]*(1.-dq)+_psy_ath_abs[iq+1]*dq;
  732. /* set stereo dB and Hz */
  733. hi->stereo_point_dB=_psy_stereo_point_dB_44[iq];
  734. hi->stereo_point_kHz[0]=_psy_stereo_point_kHz_44[0][iq]*(1.-dq)+
  735. _psy_stereo_point_kHz_44[0][iq+1]*dq;
  736. hi->stereo_point_kHz[1]=_psy_stereo_point_kHz_44[1][iq]*(1.-dq)+
  737. _psy_stereo_point_kHz_44[1][iq+1]*dq;
  738. /* set lowpass */
  739. hi->lowpass_kHz[0]=
  740. hi->lowpass_kHz[1]=
  741. _psy_lowpass_44[iq]*(1.-dq)+_psy_lowpass_44[iq+1]*dq;
  742. /* set bitrate approximation */
  743. vi->bitrate_nominal=vbr_to_approx_bitrate(vi->channels,hi->stereo_couple_p,
  744. base_quality,vi->rate);
  745. vi->bitrate_lower=-1;
  746. vi->bitrate_upper=-1;
  747. vi->bitrate_window=-1;
  748. return(ret);
  749. }
  750. int vorbis_encode_init_vbr(vorbis_info *vi,
  751. long channels,
  752. long rate,
  753. float base_quality /* 0. to 1. */
  754. ){
  755. int ret=0;
  756. ret=vorbis_encode_setup_vbr(vi,channels,rate,base_quality);
  757. if(ret){
  758. vorbis_info_clear(vi);
  759. return ret;
  760. }
  761. ret=vorbis_encode_setup_init(vi);
  762. if(ret)
  763. vorbis_info_clear(vi);
  764. return(ret);
  765. }
  766. int vorbis_encode_setup_managed(vorbis_info *vi,
  767. long channels,
  768. long rate,
  769. long max_bitrate,
  770. long nominal_bitrate,
  771. long min_bitrate){
  772. double tnominal=nominal_bitrate;
  773. double approx_vbr;
  774. int ret=0;
  775. if(nominal_bitrate<=0.){
  776. if(max_bitrate>0.){
  777. nominal_bitrate=max_bitrate*.875;
  778. }else{
  779. if(min_bitrate>0.){
  780. nominal_bitrate=min_bitrate;
  781. }else{
  782. return(OV_EINVAL);
  783. }
  784. }
  785. }
  786. approx_vbr=approx_bitrate_to_vbr(channels,(channels==2),
  787. (float)nominal_bitrate,rate);
  788. if(approx_vbr<0)return(OV_EIMPL);
  789. ret=vorbis_encode_setup_vbr(vi,channels,rate,approx_vbr);
  790. if(ret){
  791. vorbis_info_clear(vi);
  792. return ret;
  793. }
  794. /* adjust to make management's life easier. Use the ctl() interface
  795. once it's implemented */
  796. {
  797. codec_setup_info *ci=vi->codec_setup;
  798. highlevel_encode_setup *hi=&ci->hi;
  799. /* backfills */
  800. hi->stereo_backfill_p=1;
  801. hi->residue_backfill_p=1;
  802. /* no impulse blocks */
  803. hi->impulse_block_p=0;
  804. /* de-rate stereo */
  805. if(hi->stereo_point_dB && hi->stereo_couple_p && channels==2){
  806. hi->stereo_point_dB++;
  807. if(hi->stereo_point_dB>3)hi->stereo_point_dB=3;
  808. }
  809. /* slug the vbr noise setting*/
  810. hi->blocktype[0].noise_bias_quality-=.1;
  811. if(hi->blocktype[0].noise_bias_quality<0.)
  812. hi->blocktype[0].noise_bias_quality=0.;
  813. hi->blocktype[1].noise_bias_quality-=.1;
  814. if(hi->blocktype[1].noise_bias_quality<0.)
  815. hi->blocktype[1].noise_bias_quality=0.;
  816. hi->blocktype[2].noise_bias_quality-=.05;
  817. if(hi->blocktype[2].noise_bias_quality<0.)
  818. hi->blocktype[2].noise_bias_quality=0.;
  819. hi->blocktype[3].noise_bias_quality-=.05;
  820. if(hi->blocktype[3].noise_bias_quality<0.)
  821. hi->blocktype[3].noise_bias_quality=0.;
  822. /* initialize management. Currently hardcoded for 44, but so is above. */
  823. memcpy(&ci->bi,&_bm_44_default,sizeof(ci->bi));
  824. ci->bi.queue_hardmin=min_bitrate;
  825. ci->bi.queue_hardmax=max_bitrate;
  826. ci->bi.queue_avgmin=tnominal;
  827. ci->bi.queue_avgmax=tnominal;
  828. /* adjust management */
  829. ci->bi.avgfloat_noise_maxval=_bm_max_noise_offset[(int)approx_vbr];
  830. }
  831. return(ret);
  832. }
  833. int vorbis_encode_init(vorbis_info *vi,
  834. long channels,
  835. long rate,
  836. long max_bitrate,
  837. long nominal_bitrate,
  838. long min_bitrate){
  839. int ret=vorbis_encode_setup_managed(vi,channels,rate,
  840. max_bitrate,
  841. nominal_bitrate,
  842. min_bitrate);
  843. if(ret){
  844. vorbis_info_clear(vi);
  845. return(ret);
  846. }
  847. ret=vorbis_encode_setup_init(vi);
  848. if(ret)
  849. vorbis_info_clear(vi);
  850. return(ret);
  851. }
  852. int vorbis_encode_ctl(vorbis_info *vi,int number,void *arg){
  853. return(OV_EIMPL);
  854. }