Home
last modified time | relevance | path

Searched refs:mm4 (Results 1 – 25 of 84) sorted by relevance

1234

/third_party/libjpeg-turbo/simd/loongson/
Djdcolext-mmi.c42 #define mmA mm4
56 #define mmC mm4
70 #define mmE mm4
84 #define mmG mm4
98 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_ycc_rgb_convert_mmi() local
114 mm4 = 0; in jsimd_ycc_rgb_convert_mmi()
116 mm4 = _mm_cmpeq_pi16(mm4, mm4); in jsimd_ycc_rgb_convert_mmi()
118 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_ycc_rgb_convert_mmi()
120 mm0 = mm4; /* mm0=mm4={0xFF 0x00 0xFF 0x00 ..} */ in jsimd_ycc_rgb_convert_mmi()
122 mm4 = _mm_and_si64(mm4, mm5); /* mm4=Cb(0246)=CbE */ in jsimd_ycc_rgb_convert_mmi()
[all …]
Djccolext-mmi.c43 #define mmA mm4
57 #define mmC mm4
71 #define mmE mm4
85 #define mmG mm4
99 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_rgb_ycc_convert_mmi() local
329 wk[2] = mm4; in jsimd_rgb_ycc_convert_mmi()
336 mm4 = mm6; in jsimd_rgb_ycc_convert_mmi()
340 mm4 = _mm_madd_pi16(mm4, PW_MF016_MF033); in jsimd_rgb_ycc_convert_mmi()
352 mm4 = _mm_add_pi32(mm4, mm6); in jsimd_rgb_ycc_convert_mmi()
354 mm4 = _mm_add_pi32(mm4, mm5); in jsimd_rgb_ycc_convert_mmi()
[all …]
Djdsample-mmi.c58 mm4 = mm3; \
60 mm4 = _mm_slli_si64(mm4, (SIZEOF_MMWORD - 2) * BYTE_BIT); /* mm4=( - - - 4) */ \
66 mm0 = _mm_or_si64(mm0, mm4); /* mm0=( 1 2 3 4) */ \
73 mm4 = mm3; \
74 mm4 = _mm_srli_si64(mm4, (SIZEOF_MMWORD - 2) * BYTE_BIT); /* mm4=( 7 - - -) */ \
79 wk[r] = mm4; \
114 __m64 mm0, mm1, mm2, mm3 = 0.0, mm4, mm5, mm6, mm7 = 0.0; in jsimd_h2v2_fancy_upsample_mmi() local
152 mm4 = mm0; in jsimd_h2v2_fancy_upsample_mmi()
154 mm4 = _mm_unpackhi_pi8(mm4, mm3); /* mm4 = row[ 0][0]( 4 5 6 7) */ in jsimd_h2v2_fancy_upsample_mmi()
163 mm4 = _mm_mullo_pi16(mm4, PW_THREE); in jsimd_h2v2_fancy_upsample_mmi()
[all …]
Djcsample-mmi.c45 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6 = 0.0, mm7; in jsimd_h2v2_downsample_mmi() local
70 mm4 = mm0; in jsimd_h2v2_downsample_mmi()
73 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_h2v2_downsample_mmi()
76 mm0 = _mm_add_pi16(mm0, mm4); in jsimd_h2v2_downsample_mmi()
79 mm4 = mm2; in jsimd_h2v2_downsample_mmi()
82 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_h2v2_downsample_mmi()
85 mm2 = _mm_add_pi16(mm2, mm4); in jsimd_h2v2_downsample_mmi()
Djquanti-mmi.c58 mm4 = mm0; \
67 mm0 = _mm_add_pi16(mm0, mm4); /* reciprocal is always negative */ \
78 mm4 = mm0; \
88 mm6 = _mm_and_si64(mm6, mm4); /* and add input if it is */ \
93 mm4 = _mm_srai_pi16(mm4, (WORD_BIT - 1)); /* then check if... */ \
96 mm4 = _mm_and_si64(mm4, scale0); /* and add scale if it is */ \
98 mm0 = _mm_add_pi16(mm0, mm4); \
119 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_quantize_mmi() local
/third_party/flutter/skia/third_party/externals/libjpeg-turbo/simd/loongson/
Djdcolext-mmi.c42 #define mmA mm4
56 #define mmC mm4
70 #define mmE mm4
84 #define mmG mm4
98 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_ycc_rgb_convert_mmi() local
114 mm4 = 0; in jsimd_ycc_rgb_convert_mmi()
116 mm4 = _mm_cmpeq_pi16(mm4, mm4); in jsimd_ycc_rgb_convert_mmi()
118 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_ycc_rgb_convert_mmi()
120 mm0 = mm4; /* mm0=mm4={0xFF 0x00 0xFF 0x00 ..} */ in jsimd_ycc_rgb_convert_mmi()
122 mm4 = _mm_and_si64(mm4, mm5); /* mm4=Cb(0246)=CbE */ in jsimd_ycc_rgb_convert_mmi()
[all …]
Djccolext-mmi.c42 #define mmA mm4
56 #define mmC mm4
70 #define mmE mm4
84 #define mmG mm4
98 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_rgb_ycc_convert_mmi() local
315 wk[2] = mm4; in jsimd_rgb_ycc_convert_mmi()
322 mm4 = mm6; in jsimd_rgb_ycc_convert_mmi()
326 mm4 = _mm_madd_pi16(mm4, PW_MF016_MF033); in jsimd_rgb_ycc_convert_mmi()
338 mm4 = _mm_add_pi32(mm4, mm6); in jsimd_rgb_ycc_convert_mmi()
340 mm4 = _mm_add_pi32(mm4, mm5); in jsimd_rgb_ycc_convert_mmi()
[all …]
Djdsample-mmi.c58 mm4 = mm3; \
60 mm4 = _mm_slli_si64(mm4, (SIZEOF_MMWORD - 2) * BYTE_BIT); /* mm4=( - - - 4) */ \
66 mm0 = _mm_or_si64(mm0, mm4); /* mm0=( 1 2 3 4) */ \
73 mm4 = mm3; \
74 mm4 = _mm_srli_si64(mm4, (SIZEOF_MMWORD - 2) * BYTE_BIT); /* mm4=( 7 - - -) */ \
79 wk[r] = mm4; \
114 __m64 mm0, mm1, mm2, mm3 = 0.0, mm4, mm5, mm6, mm7 = 0.0; in jsimd_h2v2_fancy_upsample_mmi() local
152 mm4 = mm0; in jsimd_h2v2_fancy_upsample_mmi()
154 mm4 = _mm_unpackhi_pi8(mm4, mm3); /* mm4 = row[ 0][0]( 4 5 6 7) */ in jsimd_h2v2_fancy_upsample_mmi()
163 mm4 = _mm_mullo_pi16(mm4, PW_THREE); in jsimd_h2v2_fancy_upsample_mmi()
[all …]
Djcsample-mmi.c45 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6 = 0.0, mm7; in jsimd_h2v2_downsample_mmi() local
70 mm4 = mm0; in jsimd_h2v2_downsample_mmi()
73 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_h2v2_downsample_mmi()
76 mm0 = _mm_add_pi16(mm0, mm4); in jsimd_h2v2_downsample_mmi()
79 mm4 = mm2; in jsimd_h2v2_downsample_mmi()
82 mm4 = _mm_srli_pi16(mm4, BYTE_BIT); in jsimd_h2v2_downsample_mmi()
85 mm2 = _mm_add_pi16(mm2, mm4); in jsimd_h2v2_downsample_mmi()
Djquanti-mmi.c58 mm4 = mm0; \
67 mm0 = _mm_add_pi16(mm0, mm4); /* reciprocal is always negative */ \
78 mm4 = mm0; \
88 mm6 = _mm_and_si64(mm6, mm4); /* and add input if it is */ \
93 mm4 = _mm_srai_pi16(mm4, (WORD_BIT - 1)); /* then check if... */ \
96 mm4 = _mm_and_si64(mm4, scale0); /* and add scale if it is */ \
98 mm0 = _mm_add_pi16(mm0, mm4); \
119 __m64 mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7; in jsimd_quantize_mmi() local
/third_party/ffmpeg/libavcodec/x86/
Dsimple_idct.asm87 movq mm4, [wm1010]
88 pand mm4, mm0
89 por mm4, mm1
90 por mm4, mm2
91 por mm4, mm3
92 packssdw mm4, mm4
93 movd t0d, mm4
96 movq mm4, [coeffs + 16] ; C4 C4 C4 C4
97 pmaddwd mm4, mm0 ; C4R4+C4R0 C4r4+C4r0
106 paddd mm4, [coeffs + 8]
[all …]
Dhpeldsp_rnd_template.c42 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
51 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
74 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
81 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
90 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
97 PAVGBP(%%mm0, %%mm1, %%mm4, %%mm2, %%mm3, %%mm5) in DEF()
119 PAVGBP(%%mm1, %%mm0, %%mm4, %%mm2, %%mm1, %%mm5) in DEF()
126 PAVGBP(%%mm1, %%mm2, %%mm4, %%mm0, %%mm1, %%mm5) in DEF()
175 PAVGBP(%%mm1, %%mm0, %%mm4, %%mm2, %%mm1, %%mm5) in DEF()
177 PAVGB_MMX(%%mm3, %%mm4, %%mm0, %%mm6) in DEF()
[all …]
Dh264_intrapred.asm207 movd mm4, r2d
208 SPLATW mm4, mm4, 0
209 movq mm5, mm4
210 movq mm6, mm4
211 movq mm7, mm4
212 paddw mm4, mm0
216 packuswb mm4, mm5
218 movq [r0+r1+0], mm4
956 movd mm4, r3d
958 SPLATW mm4, mm4, 0
[all …]
Dhuffyuvdsp.asm109 movd mm4, [left_topq]
112 por mm4, mm2
114 psubw mm0, mm4 ; t-tl
121 movq mm4, [topq+wq]
122 movq mm0, mm4
123 psllq mm4, 16
124 por mm4, mm1
126 psubw mm0, mm4 ; t-tl
131 movq mm4, mm0
132 paddw mm4, mm3 ; t-tl+l
[all …]
/third_party/flutter/skia/third_party/externals/libjpeg-turbo/simd/i386/
Djccolext-mmx.asm267 ; mm0=(R0 R2 R4 R6)=RE, mm2=(G0 G2 G4 G6)=GE, mm4=(B0 B2 B4 B6)=BE
282 movq MMWORD [wk(2)], mm4 ; wk(2)=BE
289 movq mm4, mm6
293 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
308 paddd mm4, mm6
310 paddd mm4, mm5
312 psrld mm4, SCALEBITS ; mm4=CbOH
313 packssdw mm7, mm4 ; mm7=CbO
321 movq mm4, mm6
325 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
[all …]
Djdcolext-mmx.asm105 pcmpeqw mm4, mm4
107 psrlw mm4, BYTE_BIT
109 movq mm0, mm4 ; mm0=mm4={0xFF 0x00 0xFF 0x00 ..}
111 pand mm4, mm5 ; mm4=Cb(0246)=CbE
116 paddw mm4, mm7
131 movq mm2, mm4 ; mm2=CbE
133 paddw mm4, mm4 ; mm4=2*CbE
140 pmulhw mm4, [GOTOFF(eax,PW_MF0228)] ; mm4=(2*CbE * -FIX(0.22800))
145 paddw mm4, [GOTOFF(eax,PW_ONE)]
147 psraw mm4, 1 ; mm4=(CbE * -FIX(0.22800))
[all …]
Djquant-3dn.asm73 punpcklwd mm4, mm2 ; mm4=(***0***1)
78 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(01)
80 pi2fd mm4, mm4
87 movq MMWORD [MMBLOCK(0,0,edi,SIZEOF_FAST_FLOAT)], mm4
94 punpcklwd mm4, mm1 ; mm4=(***C***D)
101 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(CD)
103 pi2fd mm4, mm4
108 movq MMWORD [MMBLOCK(1,2,edi,SIZEOF_FAST_FLOAT)], mm4
175 movq mm4, mm0
177 punpckhwd mm4, mm1 ; mm4=(01 03 ** **)
[all …]
/third_party/skia/third_party/externals/libjpeg-turbo/simd/i386/
Djccolext-mmx.asm265 ; mm0=(R0 R2 R4 R6)=RE, mm2=(G0 G2 G4 G6)=GE, mm4=(B0 B2 B4 B6)=BE
280 movq MMWORD [wk(2)], mm4 ; wk(2)=BE
287 movq mm4, mm6
291 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
306 paddd mm4, mm6
308 paddd mm4, mm5
310 psrld mm4, SCALEBITS ; mm4=CbOH
311 packssdw mm7, mm4 ; mm7=CbO
319 movq mm4, mm6
323 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
[all …]
Djdcolext-mmx.asm103 pcmpeqw mm4, mm4
105 psrlw mm4, BYTE_BIT
107 movq mm0, mm4 ; mm0=mm4={0xFF 0x00 0xFF 0x00 ..}
109 pand mm4, mm5 ; mm4=Cb(0246)=CbE
114 paddw mm4, mm7
129 movq mm2, mm4 ; mm2=CbE
131 paddw mm4, mm4 ; mm4=2*CbE
138 pmulhw mm4, [GOTOFF(eax,PW_MF0228)] ; mm4=(2*CbE * -FIX(0.22800))
143 paddw mm4, [GOTOFF(eax,PW_ONE)]
145 psraw mm4, 1 ; mm4=(CbE * -FIX(0.22800))
[all …]
Djquant-3dn.asm71 punpcklwd mm4, mm2 ; mm4=(***0***1)
76 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(01)
78 pi2fd mm4, mm4
85 movq MMWORD [MMBLOCK(0,0,edi,SIZEOF_FAST_FLOAT)], mm4
92 punpcklwd mm4, mm1 ; mm4=(***C***D)
99 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(CD)
101 pi2fd mm4, mm4
106 movq MMWORD [MMBLOCK(1,2,edi,SIZEOF_FAST_FLOAT)], mm4
173 movq mm4, mm0
175 punpckhwd mm4, mm1 ; mm4=(01 03 ** **)
[all …]
/third_party/libjpeg-turbo/simd/i386/
Djccolext-mmx.asm265 ; mm0=(R0 R2 R4 R6)=RE, mm2=(G0 G2 G4 G6)=GE, mm4=(B0 B2 B4 B6)=BE
280 movq MMWORD [wk(2)], mm4 ; wk(2)=BE
287 movq mm4, mm6
291 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
306 paddd mm4, mm6
308 paddd mm4, mm5
310 psrld mm4, SCALEBITS ; mm4=CbOH
311 packssdw mm7, mm4 ; mm7=CbO
319 movq mm4, mm6
323 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
[all …]
Djdcolext-mmx.asm103 pcmpeqw mm4, mm4
105 psrlw mm4, BYTE_BIT
107 movq mm0, mm4 ; mm0=mm4={0xFF 0x00 0xFF 0x00 ..}
109 pand mm4, mm5 ; mm4=Cb(0246)=CbE
114 paddw mm4, mm7
129 movq mm2, mm4 ; mm2=CbE
131 paddw mm4, mm4 ; mm4=2*CbE
138 pmulhw mm4, [GOTOFF(eax,PW_MF0228)] ; mm4=(2*CbE * -FIX(0.22800))
143 paddw mm4, [GOTOFF(eax,PW_ONE)]
145 psraw mm4, 1 ; mm4=(CbE * -FIX(0.22800))
[all …]
Djquant-3dn.asm71 punpcklwd mm4, mm2 ; mm4=(***0***1)
76 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(01)
78 pi2fd mm4, mm4
85 movq MMWORD [MMBLOCK(0,0,edi,SIZEOF_FAST_FLOAT)], mm4
92 punpcklwd mm4, mm1 ; mm4=(***C***D)
99 psrad mm4, (DWORD_BIT-BYTE_BIT) ; mm4=(CD)
101 pi2fd mm4, mm4
106 movq MMWORD [MMBLOCK(1,2,edi,SIZEOF_FAST_FLOAT)], mm4
173 movq mm4, mm0
175 punpckhwd mm4, mm1 ; mm4=(01 03 ** **)
[all …]
/third_party/gstreamer/gstplugins_good/gst/deinterlace/tvtime/tomsmocomp/
DWierdBob.inc41 "pxor %%mm4, %%mm4\n\t"
42 "pcmpeqb %%mm4, %%mm3\n\t" // now ff where new better, else 00
43 "pcmpeqb %%mm3, %%mm4\n\t" // here ff where old better, else 00
48 "pand %%mm4, %%mm6\n\t"
49 "pand %%mm4, %%mm7\n\t"
69 "pxor %%mm4, %%mm4\n\t"
70 "pcmpeqb %%mm4, %%mm3\n\t" // now ff where new better, else 00
71 "pcmpeqb %%mm3, %%mm4\n\t" // here ff where old better, else 00
76 "pand %%mm4, %%mm6\n\t"
77 "pand %%mm4, %%mm7\n\t"
[all …]
/third_party/mesa3d/src/mesa/x86/
Dread_rgba_span_x86.S131 movq %mm0, %mm4
134 psllq $16, %mm4
136 pand %mm2, %mm4
139 por %mm4, %mm3
231 movq %mm0, %mm4
234 psllq $16, %mm4
236 pand %mm2, %mm4
239 por %mm4, %mm3
264 movq %mm0, %mm4
271 psllq $16, %mm4
[all …]

1234