intrax8.c 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764
  1. /*
  2. * This file is part of FFmpeg.
  3. *
  4. * FFmpeg is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * FFmpeg is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with FFmpeg; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. /**
  19. * @file libavcodec/intrax8.c
  20. * @brief IntraX8 (J-Frame) subdecoder, used by WMV2 and VC-1
  21. */
  22. #include "avcodec.h"
  23. #include "bitstream.h"
  24. #include "mpegvideo.h"
  25. #include "msmpeg4data.h"
  26. #include "intrax8huf.h"
  27. #include "intrax8.h"
  /* Ceiling of max_bits/table_bits. The *_MTD values derived from it below are
     what this file passes to get_vlc2() as its last argument.
     Arguments are parenthesized so that expressions can be passed safely. */
  #define MAX_TABLE_DEPTH(table_bits, max_bits) \
      (((max_bits) + (table_bits) - 1) / (table_bits))

  /* Index width (in bits) used for the first-level lookup of each VLC family. */
  #define DC_VLC_BITS 9
  #define AC_VLC_BITS 9
  #define OR_VLC_BITS 7

  #define DC_VLC_MTD MAX_TABLE_DEPTH(DC_VLC_BITS, MAX_DC_VLC_BITS)
  #define AC_VLC_MTD MAX_TABLE_DEPTH(AC_VLC_BITS, MAX_AC_VLC_BITS)
  #define OR_VLC_MTD MAX_TABLE_DEPTH(OR_VLC_BITS, MAX_OR_VLC_BITS)
  35. static VLC j_ac_vlc[2][2][8]; //[quant<13],[intra/inter],[select]
  36. static VLC j_dc_vlc[2][8]; //[quant], [select]
  37. static VLC j_orient_vlc[2][4]; //[quant], [select]
  38. static av_cold void x8_vlc_init(void){
  39. int i;
  40. #define init_ac_vlc(dst,src) \
  41. init_vlc(&dst, \
  42. AC_VLC_BITS,77, \
  43. &src[1],4,2, \
  44. &src[0],4,2, \
  45. 1)
  46. //set ac tables
  47. for(i=0;i<8;i++){
  48. init_ac_vlc( j_ac_vlc[0][0][i], x8_ac0_highquant_table[i][0] );
  49. init_ac_vlc( j_ac_vlc[0][1][i], x8_ac1_highquant_table[i][0] );
  50. init_ac_vlc( j_ac_vlc[1][0][i], x8_ac0_lowquant_table [i][0] );
  51. init_ac_vlc( j_ac_vlc[1][1][i], x8_ac1_lowquant_table [i][0] );
  52. }
  53. #undef init_ac_vlc
  54. //set dc tables
  55. #define init_dc_vlc(dst,src) \
  56. init_vlc(&dst, \
  57. DC_VLC_BITS,34, \
  58. &src[1],4,2, \
  59. &src[0],4,2, \
  60. 1);
  61. for(i=0;i<8;i++){
  62. init_dc_vlc( j_dc_vlc[0][i], x8_dc_highquant_table[i][0]);
  63. init_dc_vlc( j_dc_vlc[1][i], x8_dc_lowquant_table [i][0]);
  64. }
  65. #undef init_dc_vlc
  66. //set orient tables
  67. #define init_or_vlc(dst,src) \
  68. init_vlc(&dst, \
  69. OR_VLC_BITS,12, \
  70. &src[1],4,2, \
  71. &src[0],4,2, \
  72. 1);
  73. for(i=0;i<2;i++){
  74. init_or_vlc( j_orient_vlc[0][i], x8_orient_highquant_table[i][0]);
  75. }
  76. for(i=0;i<4;i++){
  77. init_or_vlc( j_orient_vlc[1][i], x8_orient_lowquant_table [i][0])
  78. }
  79. }
  80. #undef init_or_vlc
  81. static void x8_reset_vlc_tables(IntraX8Context * w){
  82. memset(w->j_dc_vlc,0,sizeof(w->j_dc_vlc));
  83. memset(w->j_ac_vlc,0,sizeof(w->j_ac_vlc));
  84. w->j_orient_vlc=NULL;
  85. }
  86. static inline void x8_select_ac_table(IntraX8Context * const w , int mode){
  87. MpegEncContext * const s= w->s;
  88. int table_index;
  89. assert(mode<4);
  90. if( w->j_ac_vlc[mode] ) return;
  91. table_index = get_bits(&s->gb, 3);
  92. w->j_ac_vlc[mode] = &j_ac_vlc[w->quant<13][mode>>1][table_index];//2 modes use same tables
  93. assert(w->j_ac_vlc[mode]);
  94. }
  95. static inline int x8_get_orient_vlc(IntraX8Context * w){
  96. MpegEncContext * const s= w->s;
  97. int table_index;
  98. if(!w->j_orient_vlc ){
  99. table_index = get_bits(&s->gb, 1+(w->quant<13) );
  100. w->j_orient_vlc = &j_orient_vlc[w->quant<13][table_index];
  101. }
  102. assert(w->j_orient_vlc);
  103. assert(w->j_orient_vlc->table);
  104. return get_vlc2(&s->gb, w->j_orient_vlc->table, OR_VLC_BITS, OR_VLC_MTD);
  105. }
  /*
   * Descriptors for AC VLC symbols 46..72 (entry k describes symbol 46+k).
   * Layout of each 32-bit word, as consumed by x8_get_ac_rlf():
   *   bits  0.. 7  number of extra bits to read
   *   bits  8..15  0xFF if the extra bits are added to the run,
   *                0x00 if they are added to the level
   *   bits 16..23  run base
   *   bits 24..31  level base
   * Information content: extra bits count = 3 bits, run/level selector = 1 bit,
   * run base = 6 bits, level base = 5 bits.
   */
  #define RUN_ESC(eb, run, level)   ((eb) | (0xFF<<8) | ((run)<<16) | ((level)<<24))
  #define LEVEL_ESC(eb, run, level) ((eb) | (0x00<<8) | ((run)<<16) | ((level)<<24))
  static const uint32_t ac_decode_table[]={
      /*46*/ RUN_ESC  (3, 16,  0),
      /*47*/ RUN_ESC  (3, 24,  0),
      /*48*/ RUN_ESC  (2,  4,  1),
      /*49*/ RUN_ESC  (3,  8,  1),
      /*50*/ RUN_ESC  (5, 32,  0),
      /*51*/ RUN_ESC  (4, 16,  1),

      /*52*/ LEVEL_ESC(2,  0,  4),
      /*53*/ LEVEL_ESC(2,  0,  8),
      /*54*/ LEVEL_ESC(2,  0, 12),
      /*55*/ LEVEL_ESC(3,  0, 16),
      /*56*/ LEVEL_ESC(3,  0, 24),

      /*57*/ LEVEL_ESC(2,  1,  3),
      /*58*/ LEVEL_ESC(3,  1,  7),

      /*59*/ RUN_ESC  (2, 16,  0),
      /*60*/ RUN_ESC  (2, 20,  0),
      /*61*/ RUN_ESC  (2, 24,  0),
      /*62*/ RUN_ESC  (2, 28,  0),
      /*63*/ RUN_ESC  (4, 32,  0),
      /*64*/ RUN_ESC  (4, 48,  0),

      /*65*/ RUN_ESC  (2,  4,  1),
      /*66*/ RUN_ESC  (3,  8,  1),
      /*67*/ RUN_ESC  (4, 16,  1),

      /*68*/ LEVEL_ESC(2,  0,  4),
      /*69*/ LEVEL_ESC(3,  0,  8),
      /*70*/ LEVEL_ESC(4,  0, 16),

      /*71*/ LEVEL_ESC(2,  1,  3),
      /*72*/ LEVEL_ESC(3,  1,  7),
  };
  #undef RUN_ESC
  #undef LEVEL_ESC
  146. static void x8_get_ac_rlf(IntraX8Context * const w, const int mode,
  147. int * const run, int * const level, int * const final){
  148. MpegEncContext * const s= w->s;
  149. int i,e;
  150. // x8_select_ac_table(w,mode);
  151. i = get_vlc2(&s->gb, w->j_ac_vlc[mode]->table, AC_VLC_BITS, AC_VLC_MTD);
  152. if(i<46){ //[0-45]
  153. int t,l;
  154. if(i<0){
  155. (*level)=(*final)=//prevent 'may be used unilitialized'
  156. (*run)=64;//this would cause error exit in the ac loop
  157. return;
  158. }
  159. (*final) = t = (i>22);
  160. i-=23*t;
  161. /*
  162. i== 0-15 r=0-15 l=0 ;r=i& %01111
  163. i==16-19 r=0-3 l=1 ;r=i& %00011
  164. i==20-21 r=0-1 l=2 ;r=i& %00001
  165. i==22 r=0 l=3 ;r=i& %00000
  166. l=lut_l[i/2]={0,0,0,0,0,0,0,0,1,1,2,3}[i>>1];// 11 10'01 01'00 00'00 00'00 00'00 00 => 0xE50000
  167. t=lut_mask[l]={0x0f,0x03,0x01,0x00}[l]; as i<256 the higher bits do not matter */
  168. l=(0xE50000>>(i&(0x1E)))&3;/*0x1E or (~1) or ((i>>1)<<1)*/
  169. t=(0x01030F>>(l<<3));
  170. (*run) = i&t;
  171. (*level) = l;
  172. }else if(i<73){//[46-72]
  173. uint32_t sm;
  174. uint32_t mask;
  175. i-=46;
  176. sm=ac_decode_table[i];
  177. e=get_bits(&s->gb,sm&0xF);sm>>=8;//3bits
  178. mask=sm&0xff;sm>>=8; //1bit
  179. (*run) =(sm&0xff) + (e&( mask));//6bits
  180. (*level)=(sm>>8) + (e&(~mask));//5bits
  181. (*final)=i>(58-46);
  182. }else if(i<75){//[73-74]
  183. static const uint8_t crazy_mix_runlevel[32]={
  184. 0x22,0x32,0x33,0x53,0x23,0x42,0x43,0x63,
  185. 0x24,0x52,0x34,0x73,0x25,0x62,0x44,0x83,
  186. 0x26,0x72,0x35,0x54,0x27,0x82,0x45,0x64,
  187. 0x28,0x92,0x36,0x74,0x29,0xa2,0x46,0x84};
  188. (*final)=!(i&1);
  189. e=get_bits(&s->gb,5);//get the extra bits
  190. (*run) =crazy_mix_runlevel[e]>>4;
  191. (*level)=crazy_mix_runlevel[e]&0x0F;
  192. }else{
  193. (*level)=get_bits( &s->gb, 7-3*(i&1));
  194. (*run) =get_bits( &s->gb, 6);
  195. (*final)=get_bits1(&s->gb);
  196. }
  197. return;
  198. }
  199. //static const uint8_t dc_extra_sbits[] ={0, 1,1, 1,1, 2,2, 3,3, 4,4, 5,5, 6,6, 7,7 };
  200. static const uint8_t dc_index_offset[] ={ 0, 1,2, 3,4, 5,7, 9,13, 17,25, 33,49, 65,97, 129,193};
  201. static int x8_get_dc_rlf(IntraX8Context * const w,int const mode, int * const level, int * const final){
  202. MpegEncContext * const s= w->s;
  203. int i,e,c;
  204. assert(mode<3);
  205. if( !w->j_dc_vlc[mode] ) {
  206. int table_index;
  207. table_index = get_bits(&s->gb, 3);
  208. //4 modes, same table
  209. w->j_dc_vlc[mode]= &j_dc_vlc[w->quant<13][table_index];
  210. }
  211. assert(w->j_dc_vlc);
  212. assert(w->j_dc_vlc[mode]->table);
  213. i=get_vlc2(&s->gb, w->j_dc_vlc[mode]->table, DC_VLC_BITS, DC_VLC_MTD);
  214. /*(i>=17) {i-=17;final=1;}*/
  215. c= i>16;
  216. (*final)=c;
  217. i-=17*c;
  218. if(i<=0){
  219. (*level)=0;
  220. return -i;
  221. }
  222. c=(i+1)>>1;//hackish way to calculate dc_extra_sbits[]
  223. c-=c>1;
  224. e=get_bits(&s->gb,c);//get the extra bits
  225. i=dc_index_offset[i]+(e>>1);
  226. e= -(e & 1);//0,0xffffff
  227. (*level)= (i ^ e) - e;// (i^0)-0 , (i^0xff)-(-1)
  228. return 0;
  229. }
  230. //end of huffman
  231. static int x8_setup_spatial_predictor(IntraX8Context * const w, const int chroma){
  232. MpegEncContext * const s= w->s;
  233. int range;
  234. int sum;
  235. int quant;
  236. s->dsp.x8_setup_spatial_compensation(s->dest[chroma], s->edge_emu_buffer,
  237. s->current_picture.linesize[chroma>0],
  238. &range, &sum, w->edges);
  239. if(chroma){
  240. w->orient=w->chroma_orient;
  241. quant=w->quant_dc_chroma;
  242. }else{
  243. quant=w->quant;
  244. }
  245. w->flat_dc=0;
  246. if(range < quant || range < 3){
  247. w->orient=0;
  248. if(range < 3){//yep you read right, a +-1 idct error may break decoding!
  249. w->flat_dc=1;
  250. sum+=9;
  251. w->predicted_dc = (sum*6899)>>17;//((1<<17)+9)/(8+8+1+2)=6899
  252. }
  253. }
  254. if(chroma)
  255. return 0;
  256. assert(w->orient < 3);
  257. if(range < 2*w->quant){
  258. if( (w->edges&3) == 0){
  259. if(w->orient==1) w->orient=11;
  260. if(w->orient==2) w->orient=10;
  261. }else{
  262. w->orient=0;
  263. }
  264. w->raw_orient=0;
  265. }else{
  266. static const uint8_t prediction_table[3][12]={
  267. {0,8,4, 10,11, 2,6,9,1,3,5,7},
  268. {4,0,8, 11,10, 3,5,2,6,9,1,7},
  269. {8,0,4, 10,11, 1,7,2,6,9,3,5}
  270. };
  271. w->raw_orient=x8_get_orient_vlc(w);
  272. if(w->raw_orient<0) return -1;
  273. assert(w->raw_orient < 12 );
  274. assert(w->orient<3);
  275. w->orient=prediction_table[w->orient][w->raw_orient];
  276. }
  277. return 0;
  278. }
  279. static void x8_update_predictions(IntraX8Context * const w, const int orient, const int est_run ){
  280. MpegEncContext * const s= w->s;
  281. w->prediction_table[s->mb_x*2+(s->mb_y&1)] = (est_run<<2) + 1*(orient==4) + 2*(orient==8);
  282. /*
  283. y=2n+0 ->//0 2 4
  284. y=2n+1 ->//1 3 5
  285. */
  286. }
  287. static void x8_get_prediction_chroma(IntraX8Context * const w){
  288. MpegEncContext * const s= w->s;
  289. w->edges = 1*( !(s->mb_x>>1) );
  290. w->edges|= 2*( !(s->mb_y>>1) );
  291. w->edges|= 4*( s->mb_x >= (2*s->mb_width-1) );//mb_x for chroma would always be odd
  292. w->raw_orient=0;
  293. if(w->edges&3){//lut_co[8]={inv,4,8,8, inv,4,8,8}<- =>{1,1,0,0;1,1,0,0} => 0xCC
  294. w->chroma_orient=4<<((0xCC>>w->edges)&1);
  295. return;
  296. }
  297. w->chroma_orient = (w->prediction_table[2*s->mb_x-2] & 0x03)<<2;//block[x-1][y|1-1)]
  298. }
  299. static void x8_get_prediction(IntraX8Context * const w){
  300. MpegEncContext * const s= w->s;
  301. int a,b,c,i;
  302. w->edges = 1*( !s->mb_x );
  303. w->edges|= 2*( !s->mb_y );
  304. w->edges|= 4*( s->mb_x >= (2*s->mb_width-1) );
  305. switch(w->edges&3){
  306. case 0:
  307. break;
  308. case 1:
  309. //take the one from the above block[0][y-1]
  310. w->est_run = w->prediction_table[!(s->mb_y&1)]>>2;
  311. w->orient = 1;
  312. return;
  313. case 2:
  314. //take the one from the previous block[x-1][0]
  315. w->est_run = w->prediction_table[2*s->mb_x-2]>>2;
  316. w->orient = 2;
  317. return;
  318. case 3:
  319. w->est_run = 16;
  320. w->orient = 0;
  321. return;
  322. }
  323. //no edge cases
  324. b= w->prediction_table[2*s->mb_x + !(s->mb_y&1) ];//block[x ][y-1]
  325. a= w->prediction_table[2*s->mb_x-2 + (s->mb_y&1) ];//block[x-1][y ]
  326. c= w->prediction_table[2*s->mb_x-2 + !(s->mb_y&1) ];//block[x-1][y-1]
  327. w->est_run = FFMIN(b,a);
  328. /* This condition has nothing to do with w->edges, even if it looks
  329. similar it would trigger if e.g. x=3;y=2;
  330. I guess somebody wrote something wrong and it became standard. */
  331. if( (s->mb_x & s->mb_y) != 0 ) w->est_run=FFMIN(c,w->est_run);
  332. w->est_run>>=2;
  333. a&=3;
  334. b&=3;
  335. c&=3;
  336. i=( 0xFFEAF4C4>>(2*b+8*a) )&3;
  337. if(i!=3) w->orient=i;
  338. else w->orient=( 0xFFEAD8>>(2*c+8*(w->quant>12)) )&3;
  339. /*
  340. lut1[b][a]={
  341. ->{0, 1, 0, pad},
  342. {0, 1, X, pad},
  343. {2, 2, 2, pad}}
  344. pad 2 2 2; pad X 1 0; pad 0 1 0 <-
  345. -> 11 10 '10 10 '11 11'01 00 '11 00'01 00=>0xEAF4C4
  346. lut2[q>12][c]={
  347. ->{0,2,1,pad},
  348. {2,2,2,pad}}
  349. pad 2 2 2; pad 1 2 0 <-
  350. -> 11 10'10 10 '11 01'10 00=>0xEAD8
  351. */
  352. }
  353. static void x8_ac_compensation(IntraX8Context * const w, int const direction, int const dc_level){
  354. MpegEncContext * const s= w->s;
  355. int t;
  356. #define B(x,y) s->block[0][s->dsp.idct_permutation[(x)+(y)*8]]
  357. #define T(x) ((x) * dc_level + 0x8000) >> 16;
  358. switch(direction){
  359. case 0:
  360. t = T(3811);//h
  361. B(1,0) -= t;
  362. B(0,1) -= t;
  363. t = T(487);//e
  364. B(2,0) -= t;
  365. B(0,2) -= t;
  366. t = T(506);//f
  367. B(3,0) -= t;
  368. B(0,3) -= t;
  369. t = T(135);//c
  370. B(4,0) -= t;
  371. B(0,4) -= t;
  372. B(2,1) += t;
  373. B(1,2) += t;
  374. B(3,1) += t;
  375. B(1,3) += t;
  376. t = T(173);//d
  377. B(5,0) -= t;
  378. B(0,5) -= t;
  379. t = T(61);//b
  380. B(6,0) -= t;
  381. B(0,6) -= t;
  382. B(5,1) += t;
  383. B(1,5) += t;
  384. t = T(42); //a
  385. B(7,0) -= t;
  386. B(0,7) -= t;
  387. B(4,1) += t;
  388. B(1,4) += t;
  389. B(4,4) += t;
  390. t = T(1084);//g
  391. B(1,1) += t;
  392. s->block_last_index[0] = FFMAX(s->block_last_index[0], 7*8);
  393. break;
  394. case 1:
  395. B(0,1) -= T(6269);
  396. B(0,3) -= T( 708);
  397. B(0,5) -= T( 172);
  398. B(0,7) -= T( 73);
  399. s->block_last_index[0] = FFMAX(s->block_last_index[0], 7*8);
  400. break;
  401. case 2:
  402. B(1,0) -= T(6269);
  403. B(3,0) -= T( 708);
  404. B(5,0) -= T( 172);
  405. B(7,0) -= T( 73);
  406. s->block_last_index[0] = FFMAX(s->block_last_index[0], 7);
  407. break;
  408. }
  409. #undef B
  410. #undef T
  411. }
  /**
   * Fill an 8x8 block with a single value.
   * @param pix      value written to every sample
   * @param dst      top-left sample of the block
   * @param linesize distance in bytes between the starts of consecutive rows
   */
  static void dsp_x8_put_solidcolor(uint8_t const pix, uint8_t * dst, int const linesize){
      uint8_t *row = dst;
      int rows_left = 8;

      while(rows_left-- > 0){
          memset(row, pix, 8);
          row += linesize;
      }
  }
  /* Per-position weights, indexed by the running coefficient position.
     x8_decode_intra_mb() applies them as (level*quant_table[pos])>>8 when
     use_quant_matrix is set, so 256 leaves a level unchanged. */
  static const int16_t quant_table[64] = {
      /*  0.. 7 */ 256, 256, 256, 256, 256, 256, 259, 262,
      /*  8..15 */ 265, 269, 272, 275, 278, 282, 285, 288,
      /* 16..23 */ 292, 295, 299, 303, 306, 310, 314, 317,
      /* 24..31 */ 321, 325, 329, 333, 337, 341, 345, 349,
      /* 32..39 */ 353, 358, 362, 366, 371, 375, 379, 384,
      /* 40..47 */ 389, 393, 398, 403, 408, 413, 417, 422,
      /* 48..55 */ 428, 433, 438, 443, 448, 454, 459, 465,
      /* 56..63 */ 470, 476, 482, 488, 493, 499, 505, 511
  };
  429. static int x8_decode_intra_mb(IntraX8Context* const w, const int chroma){
  430. MpegEncContext * const s= w->s;
  431. uint8_t * scantable;
  432. int final,run,level;
  433. int ac_mode,dc_mode,est_run,dc_level;
  434. int pos,n;
  435. int zeros_only;
  436. int use_quant_matrix;
  437. int sign;
  438. assert(w->orient<12);
  439. s->dsp.clear_block(s->block[0]);
  440. if(chroma){
  441. dc_mode=2;
  442. }else{
  443. dc_mode=!!w->est_run;//0,1
  444. }
  445. if(x8_get_dc_rlf(w, dc_mode, &dc_level, &final)) return -1;
  446. n=0;
  447. zeros_only=0;
  448. if(!final){//decode ac
  449. use_quant_matrix=w->use_quant_matrix;
  450. if(chroma){
  451. ac_mode = 1;
  452. est_run = 64;//not used
  453. }else{
  454. if (w->raw_orient < 3){
  455. use_quant_matrix = 0;
  456. }
  457. if(w->raw_orient > 4){
  458. ac_mode = 0;
  459. est_run = 64;
  460. }else{
  461. if(w->est_run > 1){
  462. ac_mode = 2;
  463. est_run=w->est_run;
  464. }else{
  465. ac_mode = 3;
  466. est_run = 64;
  467. }
  468. }
  469. }
  470. x8_select_ac_table(w,ac_mode);
  471. /*scantable_selector[12]={0,2,0,1,1,1,0,2,2,0,1,2};<-
  472. -> 10'01' 00'10' 10'00' 01'01' 01'00' 10'00 =>0x928548 */
  473. scantable = w->scantable[ (0x928548>>(2*w->orient))&3 ].permutated;
  474. pos=0;
  475. do {
  476. n++;
  477. if( n >= est_run ){
  478. ac_mode=3;
  479. x8_select_ac_table(w,3);
  480. }
  481. x8_get_ac_rlf(w,ac_mode,&run,&level,&final);
  482. pos+=run+1;
  483. if(pos>63){
  484. //this also handles vlc error in x8_get_ac_rlf
  485. return -1;
  486. }
  487. level= (level+1) * w->dquant;
  488. level+= w->qsum;
  489. sign = - get_bits1(&s->gb);
  490. level = (level ^ sign) - sign;
  491. if(use_quant_matrix){
  492. level = (level*quant_table[pos])>>8;
  493. }
  494. s->block[0][ scantable[pos] ]=level;
  495. }while(!final);
  496. s->block_last_index[0]=pos;
  497. }else{//DC only
  498. s->block_last_index[0]=0;
  499. if(w->flat_dc && ((unsigned)(dc_level+1)) < 3){//[-1;1]
  500. int32_t divide_quant= !chroma ? w->divide_quant_dc_luma:
  501. w->divide_quant_dc_chroma;
  502. int32_t dc_quant = !chroma ? w->quant:
  503. w->quant_dc_chroma;
  504. //original intent dc_level+=predicted_dc/quant; but it got lost somewhere in the rounding
  505. dc_level+= (w->predicted_dc*divide_quant + (1<<12) )>>13;
  506. dsp_x8_put_solidcolor( av_clip_uint8((dc_level*dc_quant+4)>>3),
  507. s->dest[chroma], s->current_picture.linesize[!!chroma]);
  508. goto block_placed;
  509. }
  510. zeros_only = (dc_level == 0);
  511. }
  512. if(!chroma){
  513. s->block[0][0] = dc_level*w->quant;
  514. }else{
  515. s->block[0][0] = dc_level*w->quant_dc_chroma;
  516. }
  517. //there is !zero_only check in the original, but dc_level check is enough
  518. if( (unsigned int)(dc_level+1) >= 3 && (w->edges&3) != 3 ){
  519. int direction;
  520. /*ac_comp_direction[orient] = { 0, 3, 3, 1, 1, 0, 0, 0, 2, 2, 2, 1 };<-
  521. -> 01'10' 10'10' 00'00' 00'01' 01'11' 11'00 =>0x6A017C */
  522. direction= (0x6A017C>>(w->orient*2))&3;
  523. if (direction != 3){
  524. x8_ac_compensation(w, direction, s->block[0][0]);//modify block_last[]
  525. }
  526. }
  527. if(w->flat_dc){
  528. dsp_x8_put_solidcolor(w->predicted_dc, s->dest[chroma], s->current_picture.linesize[!!chroma]);
  529. }else{
  530. s->dsp.x8_spatial_compensation[w->orient]( s->edge_emu_buffer,
  531. s->dest[chroma],
  532. s->current_picture.linesize[!!chroma] );
  533. }
  534. if(!zeros_only)
  535. s->dsp.idct_add ( s->dest[chroma],
  536. s->current_picture.linesize[!!chroma],
  537. s->block[0] );
  538. block_placed:
  539. if(!chroma){
  540. x8_update_predictions(w,w->orient,n);
  541. }
  542. if(s->loop_filter){
  543. uint8_t* ptr = s->dest[chroma];
  544. int linesize = s->current_picture.linesize[!!chroma];
  545. if(!( (w->edges&2) || ( zeros_only && (w->orient|4)==4 ) )){
  546. s->dsp.x8_h_loop_filter(ptr, linesize, w->quant);
  547. }
  548. if(!( (w->edges&1) || ( zeros_only && (w->orient|8)==8 ) )){
  549. s->dsp.x8_v_loop_filter(ptr, linesize, w->quant);
  550. }
  551. }
  552. return 0;
  553. }
  554. static void x8_init_block_index(MpegEncContext *s){ //FIXME maybe merge with ff_*
  555. //not s->linesize as this would be wrong for field pics
  556. //not that IntraX8 has interlacing support ;)
  557. const int linesize = s->current_picture.linesize[0];
  558. const int uvlinesize= s->current_picture.linesize[1];
  559. s->dest[0] = s->current_picture.data[0];
  560. s->dest[1] = s->current_picture.data[1];
  561. s->dest[2] = s->current_picture.data[2];
  562. s->dest[0] += s->mb_y * linesize << 3;
  563. s->dest[1] += ( s->mb_y&(~1) ) * uvlinesize << 2;//chroma blocks are on add rows
  564. s->dest[2] += ( s->mb_y&(~1) ) * uvlinesize << 2;
  565. }
  566. /**
  567. * Initialize IntraX8 frame decoder.
  568. * Requires valid MpegEncContext with valid s->mb_width before calling.
  569. * @param w pointer to IntraX8Context
  570. * @param s pointer to MpegEncContext of the parent codec
  571. */
  572. av_cold void ff_intrax8_common_init(IntraX8Context * w, MpegEncContext * const s){
  573. w->s=s;
  574. x8_vlc_init();
  575. assert(s->mb_width>0);
  576. w->prediction_table=av_mallocz(s->mb_width*2*2);//two rows, 2 blocks per cannon mb
  577. ff_init_scantable(s->dsp.idct_permutation, &w->scantable[0], wmv1_scantable[0]);
  578. ff_init_scantable(s->dsp.idct_permutation, &w->scantable[1], wmv1_scantable[2]);
  579. ff_init_scantable(s->dsp.idct_permutation, &w->scantable[2], wmv1_scantable[3]);
  580. }
  581. /**
  582. * Destroy IntraX8 frame structure.
  583. * @param w pointer to IntraX8Context
  584. */
  585. av_cold void ff_intrax8_common_end(IntraX8Context * w)
  586. {
  587. av_freep(&w->prediction_table);
  588. }
  589. /**
  590. * Decode single IntraX8 frame.
  591. * The parent codec must fill s->loopfilter and s->gb (bitstream).
  592. * The parent codec must call MPV_frame_start(), ff_er_frame_start() before calling this function.
  593. * The parent codec must call ff_er_frame_end(), MPV_frame_end() after calling this function.
  594. * This function does not use MPV_decode_mb().
  595. * lowres decoding is theoretically impossible.
  596. * @param w pointer to IntraX8Context
  597. * @param dquant doubled quantizer, it would be odd in case of VC-1 halfpq==1.
  598. * @param quant_offset offset away from zero
  599. */
  600. //FIXME extern uint8_t wmv3_dc_scale_table[32];
  601. int ff_intrax8_decode_picture(IntraX8Context * const w, int dquant, int quant_offset){
  602. MpegEncContext * const s= w->s;
  603. int mb_xy;
  604. assert(s);
  605. w->use_quant_matrix = get_bits1(&s->gb);
  606. w->dquant = dquant;
  607. w->quant = dquant >> 1;
  608. w->qsum = quant_offset;
  609. w->divide_quant_dc_luma = ((1<<16) + (w->quant>>1)) / w->quant;
  610. if(w->quant < 5){
  611. w->quant_dc_chroma = w->quant;
  612. w->divide_quant_dc_chroma = w->divide_quant_dc_luma;
  613. }else{
  614. w->quant_dc_chroma = w->quant+((w->quant+3)>>3);
  615. w->divide_quant_dc_chroma = ((1<<16) + (w->quant_dc_chroma>>1)) / w->quant_dc_chroma;
  616. }
  617. x8_reset_vlc_tables(w);
  618. s->resync_mb_x=0;
  619. s->resync_mb_y=0;
  620. for(s->mb_y=0; s->mb_y < s->mb_height*2; s->mb_y++){
  621. x8_init_block_index(s);
  622. mb_xy=(s->mb_y>>1)*s->mb_stride;
  623. for(s->mb_x=0; s->mb_x < s->mb_width*2; s->mb_x++){
  624. x8_get_prediction(w);
  625. if(x8_setup_spatial_predictor(w,0)) goto error;
  626. if(x8_decode_intra_mb(w,0)) goto error;
  627. if( s->mb_x & s->mb_y & 1 ){
  628. x8_get_prediction_chroma(w);
  629. /*when setting up chroma, no vlc is read,
  630. so no error condition can be reached*/
  631. x8_setup_spatial_predictor(w,1);
  632. if(x8_decode_intra_mb(w,1)) goto error;
  633. x8_setup_spatial_predictor(w,2);
  634. if(x8_decode_intra_mb(w,2)) goto error;
  635. s->dest[1]+= 8;
  636. s->dest[2]+= 8;
  637. /*emulate MB info in the relevant tables*/
  638. s->mbskip_table [mb_xy]=0;
  639. s->mbintra_table[mb_xy]=1;
  640. s->current_picture.qscale_table[mb_xy]=w->quant;
  641. mb_xy++;
  642. }
  643. s->dest[0]+= 8;
  644. }
  645. if(s->mb_y&1){
  646. ff_draw_horiz_band(s, (s->mb_y-1)*8, 16);
  647. }
  648. }
  649. error:
  650. ff_er_add_slice(s, s->resync_mb_x, s->resync_mb_y,
  651. (s->mb_x>>1)-1, (s->mb_y>>1)-1,
  652. (AC_END|DC_END|MV_END) );
  653. return 0;
  654. }