47 const unsigned lt = src[-1-1*
stride];
50 uint32_t v =
PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
51 (t0 + 2*t1 + t2 + 2) >> 2,
52 (t1 + 2*t2 + t3 + 2) >> 2,
53 (t2 + 2*t3 + t4 + 2) >> 2);
64 const unsigned lt = src[-1-1*
stride];
67 AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
68 AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
69 AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
70 AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
79 src[0+0*
stride]=(l1 + t1)>>1;
81 src[0+1*
stride]=(l2 + t2)>>1;
94 src[3+3*
stride]=(l3 + t3)>>1;
105 src[0+0*
stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
107 src[0+1*
stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
110 src[0+2*
stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
114 src[0+3*
stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
117 src[1+3*
stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
119 src[2+3*
stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
120 src[3+3*
stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
131 src[0+0*
stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
133 src[0+1*
stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
136 src[0+2*
stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
140 src[0+3*
stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
143 src[1+3*
stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
145 src[2+3*
stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
146 src[3+3*
stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
151 const int l0,
const int l1,
const int l2,
152 const int l3,
const int l4)
157 src[0+0*
stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
159 src[0+2*
stride]=(t1 + t2 + 1)>>1;
161 src[1+2*
stride]=(t2 + t3 + 1)>>1;
163 src[2+2*
stride]=(t3 + t4+ 1)>>1;
164 src[3+2*
stride]=(t4 + t5+ 1)>>1;
165 src[0+1*
stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
167 src[0+3*
stride]=(t1 + 2*t2 + t3 + 2)>>2;
169 src[1+3*
stride]=(t2 + 2*t3 + t4 + 2)>>2;
171 src[2+3*
stride]=(t3 + 2*t4 + t5 + 2)>>2;
172 src[3+3*
stride]=(t4 + 2*t5 + t6 + 2)>>2;
199 src[0+0*
stride]=(t0 + t1 + 1)>>1;
201 src[0+2*
stride]=(t1 + t2 + 1)>>1;
203 src[1+2*
stride]=(t2 + t3 + 1)>>1;
205 src[2+2*
stride]=(t3 + t4 + 1)>>1;
206 src[0+1*
stride]=(t0 + 2*t1 + t2 + 2)>>2;
208 src[0+3*
stride]=(t1 + 2*t2 + t3 + 2)>>2;
210 src[1+3*
stride]=(t2 + 2*t3 + t4 + 2)>>2;
212 src[2+3*
stride]=(t3 + 2*t4 + t5 + 2)>>2;
213 src[3+2*
stride]=(t4 + 2*t5 + t6 + 2)>>2;
214 src[3+3*
stride]=(t5 + 2*t6 + t7 + 2)>>2;
225 src[0+0*
stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
226 src[1+0*
stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
228 src[0+1*
stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
230 src[1+1*
stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
232 src[0+2*
stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
234 src[1+2*
stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
236 src[1+3*
stride]=(l3 + 2*l4 + l5 + 2)>>2;
238 src[2+2*
stride]=(t6 + t7 + l3 + l4 + 2)>>2;
239 src[2+3*
stride]=(l4 + l5 + 1)>>1;
240 src[3+3*
stride]=(l4 + 2*l5 + l6 + 2)>>2;
251 src[0+0*
stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
252 src[1+0*
stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
254 src[0+1*
stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
256 src[1+1*
stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
258 src[0+2*
stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
260 src[1+2*
stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
264 src[2+2*
stride]=(t6 + t7 + 2*l3 + 2)>>2;
276 for (y = 0; y < 4; y++) {
277 const uint8_t *cm_in = cm + src[-1];
278 src[0] = cm_in[top[0]];
279 src[1] = cm_in[top[1]];
280 src[2] = cm_in[top[2]];
281 src[3] = cm_in[top[3]];
288 pred16x16_plane_compat_8_c(src, stride, 1, 0);
293 pred16x16_plane_compat_8_c(src, stride, 0, 1);
302 for (y = 0; y < 16; y++) {
303 const uint8_t *cm_in = cm + src[-1];
304 src[0] = cm_in[top[0]];
305 src[1] = cm_in[top[1]];
306 src[2] = cm_in[top[2]];
307 src[3] = cm_in[top[3]];
308 src[4] = cm_in[top[4]];
309 src[5] = cm_in[top[5]];
310 src[6] = cm_in[top[6]];
311 src[7] = cm_in[top[7]];
312 src[8] = cm_in[top[8]];
313 src[9] = cm_in[top[9]];
314 src[10] = cm_in[top[10]];
315 src[11] = cm_in[top[11]];
316 src[12] = cm_in[top[12]];
317 src[13] = cm_in[top[13]];
318 src[14] = cm_in[top[14]];
319 src[15] = cm_in[top[15]];
331 dc0+= src[-1+i*stride];
332 dc0= 0x01010101*((dc0 + 4)>>3);
335 ((uint32_t*)(src+i*stride))[0]=
336 ((uint32_t*)(src+i*
stride))[1]= dc0;
348 dc0= 0x01010101*((dc0 + 4)>>3);
351 ((uint32_t*)(src+i*stride))[0]=
352 ((uint32_t*)(src+i*
stride))[1]= dc0;
364 dc0+= src[-1+(i+4)*stride];
366 dc0= 0x01010101*((dc0 + 8)>>4);
369 ((uint32_t*)(src+i*stride))[0]= dc0;
370 ((uint32_t*)(src+i*stride))[1]= dc0;
373 ((uint32_t*)(src+i*stride))[0]= dc0;
374 ((uint32_t*)(src+i*stride))[1]= dc0;
384 for (y = 0; y < 8; y++) {
385 const uint8_t *cm_in = cm + src[-1];
386 src[0] = cm_in[top[0]];
387 src[1] = cm_in[top[1]];
388 src[2] = cm_in[top[2]];
389 src[3] = cm_in[top[3]];
390 src[4] = cm_in[top[4]];
391 src[5] = cm_in[top[5]];
392 src[6] = cm_in[top[6]];
393 src[7] = cm_in[top[7]];
403 const int chroma_format_idc)
/*
 * Symbol-name builders used by the H264_PRED() table setup that follows.
 * Each one glues its arguments together with the ## operator:
 *
 *   FUNC(a, depth)   ->  a_<depth>      e.g. FUNC(pred8x8_mad_cow_dc_l0t, depth)
 *   FUNCC(a, depth)  ->  a_<depth>_c    e.g. FUNCC(pred4x4_dc, depth)
 *   FUNCD(a)         ->  a_c            e.g. FUNCD(pred4x4_tm_vp8)
 *
 * FUNCD takes no depth argument, so the name it produces is the same for
 * every depth; H264_PRED() uses it for the codec-specific (VP8/RV40/SVQ3)
 * predictors.
 *
 * Operands of ## are pasted as written (they are not macro-expanded first),
 * so the depth that reaches these macros must already be the final token.
 */
407 #define FUNC(a, depth) a ## _ ## depth
408 #define FUNCC(a, depth) a ## _ ## depth ## _c
409 #define FUNCD(a) a ## _c
411 #define H264_PRED(depth) \
412 if(codec_id != AV_CODEC_ID_RV40){\
413 if(codec_id == AV_CODEC_ID_VP8) {\
414 h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
415 h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
417 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
418 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
420 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
421 if(codec_id == AV_CODEC_ID_SVQ3)\
422 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
424 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
425 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
426 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
427 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
428 if (codec_id == AV_CODEC_ID_VP8) {\
429 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
431 h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
432 h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
433 if(codec_id != AV_CODEC_ID_VP8) {\
434 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
435 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
436 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
438 h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
439 h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
440 h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
441 h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
442 h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
445 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
446 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
447 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
448 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
449 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
450 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
451 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
452 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
453 h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
454 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
455 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
456 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
457 h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
458 h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
459 h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
462 h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
463 h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
464 h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
465 h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
466 h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
467 h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
468 h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
469 h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
470 h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
471 h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
472 h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
473 h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
475 if (chroma_format_idc <= 1) {\
476 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
477 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
479 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
480 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
482 if (codec_id != AV_CODEC_ID_VP8) {\
483 if (chroma_format_idc <= 1) {\
484 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
486 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
489 h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
490 if(codec_id != AV_CODEC_ID_RV40 && codec_id != AV_CODEC_ID_VP8){\
491 if (chroma_format_idc <= 1) {\
492 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
493 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
494 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
495 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
496 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
497 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
498 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
500 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
501 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
502 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
503 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
504 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
505 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
506 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
509 h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
510 h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
511 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
512 if (codec_id == AV_CODEC_ID_VP8) {\
513 h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
514 h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
517 if (chroma_format_idc <= 1) {\
518 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
520 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
523 h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
524 h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
525 h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
527 case AV_CODEC_ID_SVQ3:\
528 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
530 case AV_CODEC_ID_RV40:\
531 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
533 case AV_CODEC_ID_VP8:\
534 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
535 h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
536 h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
539 h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
542 h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
543 h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
544 h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
547 h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
548 h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
549 h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
550 h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
551 if (chroma_format_idc <= 1) {\
552 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
553 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
555 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add , depth);\
556 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add , depth);\
558 h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
559 h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\