216 |
CONSIM_1x8_SSE2 |
CONSIM_1x8_SSE2 |
217 |
|
|
218 |
;accumulate xmm5-7 |
;accumulate xmm5-7 |
219 |
pshufd xmm0, xmm5, 0EH |
pshufd xmm0, xmm5, 0x0E |
220 |
paddd xmm5, xmm0 |
paddd xmm5, xmm0 |
221 |
pshufd xmm0, xmm5, 01H |
pshufd xmm0, xmm5, 0x01 |
222 |
paddd xmm5, xmm0 |
paddd xmm5, xmm0 |
223 |
|
|
224 |
pshufd xmm1, xmm6, 0EH |
pshufd xmm1, xmm6, 0x0E |
225 |
paddd xmm6, xmm1 |
paddd xmm6, xmm1 |
226 |
pshufd xmm1, xmm6, 01H |
pshufd xmm1, xmm6, 0x01 |
227 |
paddd xmm6, xmm1 |
paddd xmm6, xmm1 |
228 |
|
|
229 |
pshufd xmm2, xmm7, 0EH |
pshufd xmm2, xmm7, 0x0E |
230 |
paddd xmm7, xmm2 |
paddd xmm7, xmm2 |
231 |
pshufd xmm2, xmm7, 01H |
pshufd xmm2, xmm7, 0x01 |
232 |
paddd xmm7, xmm2 |
paddd xmm7, xmm2 |
233 |
|
|
234 |
CONSIM_WRITEOUT xmm5,xmm6,xmm7 |
CONSIM_WRITEOUT xmm5,xmm6,xmm7 |
285 |
CONSIM_WRITEOUT mm5,mm6,mm7 |
CONSIM_WRITEOUT mm5,mm6,mm7 |
286 |
ret |
ret |
287 |
.endfunc |
.endfunc |
288 |
|
|
289 |
|
%ifidn __OUTPUT_FORMAT__,elf |
290 |
|
section ".note.GNU-stack" noalloc noexec nowrite progbits |
291 |
|
%endif |