mirror of
https://chromium.googlesource.com/libyuv/libyuv
synced 2025-12-07 17:26:49 +08:00
ARGBPolynomialRow_AVX2 on gcc: use the VEX-encoded 128-bit vmovq instead of the SSE2 movq to avoid a stall.
BUG=265
TEST=unittest polynomial
R=ryanpetrie@google.com
Review URL: https://webrtc-codereview.appspot.com/2679004
git-svn-id: http://libyuv.googlecode.com/svn/trunk@816 16f28f9a-4ce2-e073-06de-1de4eb20be90
This commit is contained in:
parent
a03b8adde8
commit
78ad8d1f98
@@ -6068,7 +6068,7 @@ void ARGBPolynomialRow_AVX2(const uint8* src_argb,
|
||||
"vpermq $0xd8,%%ymm0,%%ymm0 \n"
|
||||
"vpackuswb %%xmm0,%%xmm0,%%xmm0 \n"
|
||||
"sub $0x2,%2 \n"
|
||||
"movq %%xmm0,"MEMACCESS(1)" \n"
|
||||
"vmovq %%xmm0,"MEMACCESS(1)" \n"
|
||||
"lea "MEMLEA(0x8,1)",%1 \n"
|
||||
"jg 1b \n"
|
||||
"vzeroupper \n"
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user