39 int src_x,
int src_y,
int src_stride,
slice_buffer * sb,
int add, uint8_t * dst8){
44 const uint8_t *obmc1= obmc + y*obmc_stride;
45 const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
46 const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
47 const uint8_t *
obmc4= obmc3+ (obmc_stride>>1);
50 int v= obmc1[x] * block[3][x + y*src_stride]
51 +obmc2[x] * block[2][x + y*src_stride]
52 +obmc3[x] * block[1][x + y*src_stride]
53 +obmc4[x] * block[0][x + y*src_stride];
62 if(v&(~255)) v= ~(v>>31);
63 dst8[x + y*src_stride] =
v;
72 int plane_index,
level, orientation;
74 for(plane_index=0; plane_index<3; plane_index++){
76 for(orientation=level ? 1:0; orientation<4; orientation++){
101 for(i=0; i<
QROOT; i++){
103 v *= pow(2, 1.0 / QROOT);
106 static void mc_block(
Plane *p, uint8_t *dst,
const uint8_t *src,
int stride,
int b_w,
int b_h,
int dx,
int dy){
107 static const uint8_t weight[64]={
118 static const uint8_t brane[256]={
119 0x00,0x01,0x01,0x01,0x01,0x01,0x01,0x01,0x11,0x12,0x12,0x12,0x12,0x12,0x12,0x12,
120 0x04,0x05,0xcc,0xcc,0xcc,0xcc,0xcc,0x41,0x15,0x16,0xcc,0xcc,0xcc,0xcc,0xcc,0x52,
121 0x04,0xcc,0x05,0xcc,0xcc,0xcc,0x41,0xcc,0x15,0xcc,0x16,0xcc,0xcc,0xcc,0x52,0xcc,
122 0x04,0xcc,0xcc,0x05,0xcc,0x41,0xcc,0xcc,0x15,0xcc,0xcc,0x16,0xcc,0x52,0xcc,0xcc,
123 0x04,0xcc,0xcc,0xcc,0x41,0xcc,0xcc,0xcc,0x15,0xcc,0xcc,0xcc,0x16,0xcc,0xcc,0xcc,
124 0x04,0xcc,0xcc,0x41,0xcc,0x05,0xcc,0xcc,0x15,0xcc,0xcc,0x52,0xcc,0x16,0xcc,0xcc,
125 0x04,0xcc,0x41,0xcc,0xcc,0xcc,0x05,0xcc,0x15,0xcc,0x52,0xcc,0xcc,0xcc,0x16,0xcc,
126 0x04,0x41,0xcc,0xcc,0xcc,0xcc,0xcc,0x05,0x15,0x52,0xcc,0xcc,0xcc,0xcc,0xcc,0x16,
127 0x44,0x45,0x45,0x45,0x45,0x45,0x45,0x45,0x55,0x56,0x56,0x56,0x56,0x56,0x56,0x56,
128 0x48,0x49,0xcc,0xcc,0xcc,0xcc,0xcc,0x85,0x59,0x5A,0xcc,0xcc,0xcc,0xcc,0xcc,0x96,
129 0x48,0xcc,0x49,0xcc,0xcc,0xcc,0x85,0xcc,0x59,0xcc,0x5A,0xcc,0xcc,0xcc,0x96,0xcc,
130 0x48,0xcc,0xcc,0x49,0xcc,0x85,0xcc,0xcc,0x59,0xcc,0xcc,0x5A,0xcc,0x96,0xcc,0xcc,
131 0x48,0xcc,0xcc,0xcc,0x49,0xcc,0xcc,0xcc,0x59,0xcc,0xcc,0xcc,0x96,0xcc,0xcc,0xcc,
132 0x48,0xcc,0xcc,0x85,0xcc,0x49,0xcc,0xcc,0x59,0xcc,0xcc,0x96,0xcc,0x5A,0xcc,0xcc,
133 0x48,0xcc,0x85,0xcc,0xcc,0xcc,0x49,0xcc,0x59,0xcc,0x96,0xcc,0xcc,0xcc,0x5A,0xcc,
134 0x48,0x85,0xcc,0xcc,0xcc,0xcc,0xcc,0x49,0x59,0x96,0xcc,0xcc,0xcc,0xcc,0xcc,0x5A,
137 static const uint8_t needs[16]={
147 int16_t *tmpI= tmpIt;
148 uint8_t *tmp2= tmp2t[0];
149 const uint8_t *hpel[11];
150 assert(dx<16 && dy<16);
151 r= brane[dx + 16*dy]&15;
152 l= brane[dx + 16*dy]>>4;
154 b= needs[l] | needs[
r];
160 for(x=0; x < b_w; x++){
161 int a_1=src[x + HTAPS_MAX/2-4];
162 int a0= src[x + HTAPS_MAX/2-3];
163 int a1= src[x + HTAPS_MAX/2-2];
164 int a2= src[x + HTAPS_MAX/2-1];
165 int a3= src[x + HTAPS_MAX/2+0];
166 int a4= src[x + HTAPS_MAX/2+1];
167 int a5= src[x + HTAPS_MAX/2+2];
168 int a6= src[x + HTAPS_MAX/2+3];
171 am= 20*(a2+
a3) - 5*(a1+a4) + (a0+
a5);
180 if(am&(~255)) am= ~(am>>31);
193 for(y=0; y < b_h; y++){
194 for(x=0; x < b_w+1; x++){
205 am= (20*(a2+
a3) - 5*(a1+a4) + (a0+
a5) + 16)>>5;
209 if(am&(~255)) am= ~(am>>31);
221 for(y=0; y < b_h; y++){
222 for(x=0; x < b_w; x++){
233 am= (20*(a2+
a3) - 5*(a1+a4) + (a0+
a5) + 512)>>10;
236 if(am&(~255)) am= ~(am>>31);
245 hpel[ 1]= tmp2t[0] + stride*(
HTAPS_MAX/2-1);
250 hpel[ 6]= tmp2t[1] + 1;
253 hpel[ 9]= hpel[1] +
stride;
254 hpel[10]= hpel[8] + 1;
257 const uint8_t *src1= hpel[dx/8 + dy/8*4 ];
258 const uint8_t *src2= hpel[dx/8 + dy/8*4+1];
259 const uint8_t *src3= hpel[dx/8 + dy/8*4+4];
260 const uint8_t *src4= hpel[dx/8 + dy/8*4+5];
263 for(y=0; y < b_h; y++){
264 for(x=0; x < b_w; x++){
265 dst[x]= ((8-dx)*(8-dy)*src1[x] + dx*(8-dy)*src2[x]+
266 (8-dx)* dy *src3[x] + dx* dy *src4[x]+32)>>6;
275 const uint8_t *src1= hpel[l];
276 const uint8_t *src2= hpel[
r];
277 int a= weight[((dx&7) + (8*(dy&7)))];
279 for(y=0; y < b_h; y++){
280 for(x=0; x < b_w; x++){
281 dst[x]= (a*src1[x] + b*src2[x] + 4)>>3;
290 void ff_snow_pred_block(
SnowContext *s, uint8_t *dst, uint8_t *tmp,
int stride,
int sx,
int sy,
int b_w,
int b_h,
BlockNode *
block,
int plane_index,
int w,
int h){
293 const unsigned color = block->
color[plane_index];
294 const unsigned color4 = color*0x01010101;
296 for(y=0; y < b_h; y++){
297 *(uint32_t*)&dst[0 + y*stride]= color4;
298 *(uint32_t*)&dst[4 + y*stride]= color4;
299 *(uint32_t*)&dst[8 + y*stride]= color4;
300 *(uint32_t*)&dst[12+ y*stride]= color4;
301 *(uint32_t*)&dst[16+ y*stride]= color4;
302 *(uint32_t*)&dst[20+ y*stride]= color4;
303 *(uint32_t*)&dst[24+ y*stride]= color4;
304 *(uint32_t*)&dst[28+ y*stride]= color4;
307 for(y=0; y < b_h; y++){
308 *(uint32_t*)&dst[0 + y*stride]= color4;
309 *(uint32_t*)&dst[4 + y*stride]= color4;
310 *(uint32_t*)&dst[8 + y*stride]= color4;
311 *(uint32_t*)&dst[12+ y*stride]= color4;
314 for(y=0; y < b_h; y++){
315 *(uint32_t*)&dst[0 + y*stride]= color4;
316 *(uint32_t*)&dst[4 + y*stride]= color4;
319 for(y=0; y < b_h; y++){
320 *(uint32_t*)&dst[0 + y*stride]= color4;
323 for(y=0; y < b_h; y++){
324 for(x=0; x < b_w; x++){
336 const int tab_index= 3 - (b_w>>2) + (b_w>>4);
340 if( (
unsigned)sx >= w - b_w - (
HTAPS_MAX-2)
341 || (
unsigned)sy >= h - b_h - (
HTAPS_MAX-2)){
347 assert(b_w>1 && b_h>1);
348 assert((tab_index>=0 && tab_index<4) || b_w==32);
349 if((dx&3) || (dy&3) || !(b_w == b_h || 2*b_w == b_h || b_w == 2*b_h) || (b_w&(b_w-1)) || !s->
plane[plane_index].
fast_mc )
350 mc_block(&s->
plane[plane_index], dst, src, stride, b_w, b_h, dx, dy);
353 for(y=0; y<b_h; y+=16){
370 #define mca(dx,dy,b_w)\
371 static void mc_block_hpel ## dx ## dy ## b_w(uint8_t *dst, const uint8_t *src, int stride, int h){\
373 mc_block(NULL, dst, src-(HTAPS_MAX/2-1)-(HTAPS_MAX/2-1)*stride, stride, b_w, b_w, dx, dy);\
397 s->dsp.put_qpel_pixels_tab [0][dy+dx/4]=\
398 s->dsp.put_no_rnd_qpel_pixels_tab[0][dy+dx/4]=\
399 s->dsp.put_h264_qpel_pixels_tab[0][dy+dx/4];\
400 s->dsp.put_qpel_pixels_tab [1][dy+dx/4]=\
401 s->dsp.put_no_rnd_qpel_pixels_tab[1][dy+dx/4]=\
402 s->dsp.put_h264_qpel_pixels_tab[1][dy+dx/4];
422 s->dsp.put_pixels_tab [0][dy/4+dx/8]=\
423 s->dsp.put_no_rnd_pixels_tab[0][dy/4+dx/8]=\
424 mc_block_hpel ## dx ## dy ## 16;\
425 s->dsp.put_pixels_tab [1][dy/4+dx/8]=\
426 s->dsp.put_no_rnd_pixels_tab[1][dy/4+dx/8]=\
427 mc_block_hpel ## dx ## dy ## 8;
461 int plane_index,
level, orientation;
463 for(plane_index=0; plane_index<3; plane_index++){
475 for(orientation=level ? 1 : 0; orientation<4; orientation++){
481 b->
width = (w + !(orientation&1))>>1;
482 b->
height= (h + !(orientation>1))>>1;
512 #define USE_HALFPEL_PLANE 0
522 uint8_t *src= frame->
data[p];
533 halfpel[1][p][i]= (20*(src[i] + src[i+1]) - 5*(src[i-1] + src[i+2]) + (src[i-2] + src[i+3]) + 16 )>>5;
540 halfpel[2][p][i]= (20*(src[i] + src[i+ls]) - 5*(src[i-ls] + src[i+2*ls]) + (src[i-2*ls] + src[i+3*ls]) + 16 )>>5;
548 halfpel[3][p][i]= (20*(src[i] + src[i+ls]) - 5*(src[i-ls] + src[i+2*ls]) + (src[i-2*ls] + src[i+3*ls]) + 16 )>>5;
623 int plane_index,
level, orientation, i;
644 for(plane_index=0; plane_index<3; plane_index++){
646 for(orientation=level ? 1 : 0; orientation<4; orientation++){