; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $62, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $2, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: andb $15, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $61, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $3, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $60, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $4, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $59, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $5, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $58, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $6, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $57, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $7, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $7, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $56, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $55, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $9, %k0, %k1
; X32-NEXT: andb $2, %cl
; X32-NEXT: shrb %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $54, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $10, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: movl %eax, %esi
; X32-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $53, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $11, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $52, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $12, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $51, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $13, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $50, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $14, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $49, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $15, %k0, %k1
; X32-NEXT: shrl $15, %edx
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $48, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $16, %k0, %k1
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $47, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $17, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $46, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $18, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $45, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $19, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $44, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $20, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $43, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $21, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $42, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $22, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $41, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $23, %k0, %k1
; X32-NEXT: shrb $7, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $40, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $24, %k0, %k1
; X32-NEXT: movl %esi, %edx
; X32-NEXT: shrl $24, %edx
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $39, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $25, %k0, %k1
; X32-NEXT: movl %edx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $38, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $26, %k0, %k1
; X32-NEXT: andb $15, %dl
; X32-NEXT: movl %edx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $37, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $27, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $36, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $28, %k0, %k1
; X32-NEXT: movl %esi, %ecx
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $35, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $29, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $34, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $30, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $33, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $31, %k0, %k1
; X32-NEXT: shrl $31, %ecx
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $32, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $32, %k0, %k1
; X32-NEXT: kmovd %ebx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $31, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $33, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $30, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $34, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $15, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $29, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $35, %k0, %k1
; X32-NEXT: shrb $3, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $28, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $36, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $27, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $37, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $5, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $26, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $38, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $6, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $25, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $39, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $7, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $24, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $40, %k0, %k1
; X32-NEXT: movb %bh, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $23, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $41, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $22, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $42, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: movzwl %bx, %eax
; X32-NEXT: kmovd %esi, %k3
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $21, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $43, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: shrl $15, %eax
; X32-NEXT: kmovd %eax, %k4
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $20, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $44, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $19, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $45, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $18, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $46, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $17, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $47, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $16, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $48, %k0, %k1
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $15, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $49, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $14, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $50, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $13, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $51, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $12, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k4
+; X32-NEXT: kxorq %k1, %k0, %k4
; X32-NEXT: kshiftrq $52, %k4, %k0
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kmovd %eax, %k3
; X32-NEXT: kshiftlq $63, %k5, %k5
; X32-NEXT: kshiftrq $11, %k5, %k5
-; X32-NEXT: kxorq %k4, %k5, %k4
+; X32-NEXT: kxorq %k5, %k4, %k4
; X32-NEXT: kshiftrq $53, %k4, %k5
; X32-NEXT: kxorq %k6, %k5, %k5
; X32-NEXT: kshiftlq $63, %k5, %k5
; X32-NEXT: kshiftrq $10, %k5, %k5
-; X32-NEXT: kxorq %k4, %k5, %k5
+; X32-NEXT: kxorq %k5, %k4, %k5
; X32-NEXT: kshiftrq $54, %k5, %k4
; X32-NEXT: kxorq %k7, %k4, %k6
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k6, %k6
; X32-NEXT: kshiftrq $9, %k6, %k6
-; X32-NEXT: kxorq %k5, %k6, %k5
+; X32-NEXT: kxorq %k6, %k5, %k5
; X32-NEXT: kshiftrq $55, %k5, %k6
; X32-NEXT: kxorq %k0, %k6, %k0
; X32-NEXT: kshiftlq $63, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k0
-; X32-NEXT: kxorq %k5, %k0, %k0
+; X32-NEXT: kxorq %k0, %k5, %k0
; X32-NEXT: kshiftrq $56, %k0, %k5
; X32-NEXT: kxorq %k1, %k5, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: kmovd %eax, %k6
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $7, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $57, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $6, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $58, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $5, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $59, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $4, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $60, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $3, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $61, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $2, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $62, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: shrl $31, %ebx
; X32-NEXT: movb {{[0-9]+}}(%esp), %al
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $1, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftlq $1, %k0, %k0
; X32-NEXT: kshiftrq $1, %k0, %k0
; X32-NEXT: kshiftlq $63, %k2, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $62, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $2, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: andb $15, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $61, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $3, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $60, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $4, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $59, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $5, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $58, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $6, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $57, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $7, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $7, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $56, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $55, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $9, %k0, %k1
; X32-NEXT: andb $2, %cl
; X32-NEXT: shrb %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $54, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $10, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: movl %eax, %esi
; X32-NEXT: movl {{[0-9]+}}(%esp), %ebx
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $53, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $11, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $52, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $12, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $51, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $13, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $50, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $14, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $49, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $15, %k0, %k1
; X32-NEXT: shrl $15, %edx
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $48, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $16, %k0, %k1
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $47, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $17, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $46, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $18, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $45, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $19, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $44, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $20, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $43, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $21, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $42, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $22, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $41, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $23, %k0, %k1
; X32-NEXT: shrb $7, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $40, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $24, %k0, %k1
; X32-NEXT: movl %esi, %edx
; X32-NEXT: shrl $24, %edx
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $39, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $25, %k0, %k1
; X32-NEXT: movl %edx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $38, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $26, %k0, %k1
; X32-NEXT: andb $15, %dl
; X32-NEXT: movl %edx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $37, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $27, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $36, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $28, %k0, %k1
; X32-NEXT: movl %esi, %ecx
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $35, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $29, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $34, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $30, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $33, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $31, %k0, %k1
; X32-NEXT: shrl $31, %ecx
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $32, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $32, %k0, %k1
; X32-NEXT: kmovd %ebx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $31, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $33, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $30, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $34, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $15, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $29, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $35, %k0, %k1
; X32-NEXT: shrb $3, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $28, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $36, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $27, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $37, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $5, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $26, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $38, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $6, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $25, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $39, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $7, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $24, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $40, %k0, %k1
; X32-NEXT: movb %bh, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $23, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $41, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $22, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $42, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: movzwl %bx, %eax
; X32-NEXT: kmovd %esi, %k3
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $21, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $43, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: shrl $15, %eax
; X32-NEXT: kmovd %eax, %k4
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $20, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $44, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $19, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $45, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $18, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $46, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $17, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $47, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $16, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $48, %k0, %k1
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $15, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $49, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $14, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $50, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $13, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $51, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $12, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k4
+; X32-NEXT: kxorq %k1, %k0, %k4
; X32-NEXT: kshiftrq $52, %k4, %k0
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kmovd %eax, %k3
; X32-NEXT: kshiftlq $63, %k5, %k5
; X32-NEXT: kshiftrq $11, %k5, %k5
-; X32-NEXT: kxorq %k4, %k5, %k4
+; X32-NEXT: kxorq %k5, %k4, %k4
; X32-NEXT: kshiftrq $53, %k4, %k5
; X32-NEXT: kxorq %k6, %k5, %k5
; X32-NEXT: kshiftlq $63, %k5, %k5
; X32-NEXT: kshiftrq $10, %k5, %k5
-; X32-NEXT: kxorq %k4, %k5, %k5
+; X32-NEXT: kxorq %k5, %k4, %k5
; X32-NEXT: kshiftrq $54, %k5, %k4
; X32-NEXT: kxorq %k7, %k4, %k6
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k6, %k6
; X32-NEXT: kshiftrq $9, %k6, %k6
-; X32-NEXT: kxorq %k5, %k6, %k5
+; X32-NEXT: kxorq %k6, %k5, %k5
; X32-NEXT: kshiftrq $55, %k5, %k6
; X32-NEXT: kxorq %k0, %k6, %k0
; X32-NEXT: kshiftlq $63, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k0
-; X32-NEXT: kxorq %k5, %k0, %k0
+; X32-NEXT: kxorq %k0, %k5, %k0
; X32-NEXT: kshiftrq $56, %k0, %k5
; X32-NEXT: kxorq %k1, %k5, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: kmovd %eax, %k6
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $7, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $57, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $6, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $58, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $5, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $59, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $4, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $60, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $3, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $61, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $2, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $62, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: shrl $31, %ebx
; X32-NEXT: movb {{[0-9]+}}(%esp), %al
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $1, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftlq $1, %k0, %k0
; X32-NEXT: kshiftrq $1, %k0, %k0
; X32-NEXT: kshiftlq $63, %k2, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $62, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $2, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: andb $15, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $61, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $3, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $60, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $4, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $59, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $5, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $58, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $6, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $57, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $7, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $7, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $56, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $55, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $9, %k0, %k1
; X32-NEXT: andb $2, %cl
; X32-NEXT: shrb %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $54, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $10, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: movl %eax, %esi
; X32-NEXT: movl 12(%ebp), %ebx
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $53, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $11, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $52, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $12, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $51, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $13, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $50, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $14, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $49, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $15, %k0, %k1
; X32-NEXT: shrl $15, %edx
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $48, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $16, %k0, %k1
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $47, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $17, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $46, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $18, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $45, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $19, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $44, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $20, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $43, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $21, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $42, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $22, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $41, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $23, %k0, %k1
; X32-NEXT: shrb $7, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $40, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $24, %k0, %k1
; X32-NEXT: movl %esi, %edx
; X32-NEXT: shrl $24, %edx
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $39, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $25, %k0, %k1
; X32-NEXT: movl %edx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $38, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $26, %k0, %k1
; X32-NEXT: andb $15, %dl
; X32-NEXT: movl %edx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $37, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $27, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $36, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $28, %k0, %k1
; X32-NEXT: movl %esi, %ecx
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $35, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $29, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $34, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $30, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $33, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $31, %k0, %k1
; X32-NEXT: shrl $31, %ecx
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $32, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $32, %k0, %k1
; X32-NEXT: kmovd %ebx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $31, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $33, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $30, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $34, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $15, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $29, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $35, %k0, %k1
; X32-NEXT: shrb $3, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $28, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $36, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $27, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $37, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $5, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $26, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $38, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $6, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $25, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $39, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $7, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $24, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $40, %k0, %k1
; X32-NEXT: movb %bh, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $23, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $41, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $22, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $42, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $21, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $43, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $20, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $44, %k0, %k1
; X32-NEXT: movzwl %bx, %eax
; X32-NEXT: movl %eax, %esi
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $19, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $45, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $18, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $46, %k0, %k1
; X32-NEXT: movl %eax, %esi
; X32-NEXT: shrl $14, %esi
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $17, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $47, %k0, %k1
; X32-NEXT: shrl $15, %eax
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $16, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $48, %k0, %k1
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $15, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $49, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $14, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $50, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $13, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $51, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $12, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $52, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $11, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $53, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $10, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $54, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $9, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $55, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $8, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $56, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $7, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $57, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $6, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $58, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $5, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $59, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $4, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $60, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $28, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $3, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $61, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $2, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $62, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $1, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftlq $1, %k0, %k0
; X32-NEXT: kshiftrq $1, %k0, %k0
; X32-NEXT: shrl $31, %ebx
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $62, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $2, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: andb $15, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $61, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $3, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $60, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $4, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $59, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $5, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $58, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $6, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $57, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $7, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $7, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $56, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $8, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $55, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $9, %k0, %k1
; X32-NEXT: andb $2, %cl
; X32-NEXT: shrb %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $54, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $10, %k0, %k1
; X32-NEXT: movb %ah, %cl
; X32-NEXT: movl %eax, %esi
; X32-NEXT: movl 12(%ebp), %ebx
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $53, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $11, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $52, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $12, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $51, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $13, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $50, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $14, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $49, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $15, %k0, %k1
; X32-NEXT: shrl $15, %edx
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $48, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $16, %k0, %k1
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $47, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $17, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $46, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $18, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $45, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $19, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $44, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $20, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $4, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $43, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $21, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $5, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $42, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $22, %k0, %k1
; X32-NEXT: movl %eax, %ecx
; X32-NEXT: shrb $6, %cl
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $41, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $23, %k0, %k1
; X32-NEXT: shrb $7, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $40, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $24, %k0, %k1
; X32-NEXT: movl %esi, %edx
; X32-NEXT: shrl $24, %edx
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $39, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $25, %k0, %k1
; X32-NEXT: movl %edx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $38, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $26, %k0, %k1
; X32-NEXT: andb $15, %dl
; X32-NEXT: movl %edx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $37, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $27, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $36, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $28, %k0, %k1
; X32-NEXT: movl %esi, %ecx
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $35, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $29, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $34, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $30, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $33, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $31, %k0, %k1
; X32-NEXT: shrl $31, %ecx
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $32, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $32, %k0, %k1
; X32-NEXT: kmovd %ebx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $31, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $33, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $2, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $30, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $34, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: andb $15, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $29, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $35, %k0, %k1
; X32-NEXT: shrb $3, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $28, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $36, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $27, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $37, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $5, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $26, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $38, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $6, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $25, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $39, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrb $7, %al
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $24, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $40, %k0, %k1
; X32-NEXT: movb %bh, %al
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $23, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $41, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $22, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $42, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $21, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $43, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $20, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $44, %k0, %k1
; X32-NEXT: movzwl %bx, %eax
; X32-NEXT: movl %eax, %esi
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $19, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $45, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $18, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $46, %k0, %k1
; X32-NEXT: movl %eax, %esi
; X32-NEXT: shrl $14, %esi
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $17, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $47, %k0, %k1
; X32-NEXT: shrl $15, %eax
; X32-NEXT: kmovd %eax, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $16, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $48, %k0, %k1
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $15, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $49, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $14, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $50, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $13, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $51, %k0, %k1
; X32-NEXT: shrb $3, %dl
; X32-NEXT: kmovd %edx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $12, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $52, %k0, %k1
; X32-NEXT: movl %ecx, %eax
; X32-NEXT: shrb $4, %al
; X32-NEXT: kmovd %eax, %k7
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $11, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $53, %k0, %k1
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $10, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $54, %k0, %k1
; X32-NEXT: kxorq %k3, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $9, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $55, %k0, %k1
; X32-NEXT: kxorq %k4, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $8, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $56, %k0, %k1
; X32-NEXT: kxorq %k5, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $7, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $57, %k0, %k1
; X32-NEXT: kxorq %k6, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $6, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $58, %k0, %k1
; X32-NEXT: kxorq %k7, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $5, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $59, %k0, %k1
; X32-NEXT: shrb $3, %cl
; X32-NEXT: kmovd %ecx, %k2
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $4, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $60, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $28, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $3, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $61, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $29, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $2, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftrq $62, %k0, %k1
; X32-NEXT: movl %ebx, %eax
; X32-NEXT: shrl $30, %eax
; X32-NEXT: kxorq %k2, %k1, %k1
; X32-NEXT: kshiftlq $63, %k1, %k1
; X32-NEXT: kshiftrq $1, %k1, %k1
-; X32-NEXT: kxorq %k0, %k1, %k0
+; X32-NEXT: kxorq %k1, %k0, %k0
; X32-NEXT: kshiftlq $1, %k0, %k0
; X32-NEXT: kshiftrq $1, %k0, %k0
; X32-NEXT: shrl $31, %ebx
; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $62, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k5, %k1, %k7
+; AVX512F-32-NEXT: kxorq %k1, %k5, %k7
; AVX512F-32-NEXT: kshiftrq $2, %k7, %k1
; AVX512F-32-NEXT: kxorq %k2, %k1, %k2
; AVX512F-32-NEXT: kmovd %ecx, %k5
; AVX512F-32-NEXT: shrb %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $61, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
+; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $3, %k7, %k2
; AVX512F-32-NEXT: kxorq %k0, %k2, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $60, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k7, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftrq $4, %k0, %k7
; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $59, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k0, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: kshiftrq $5, %k7, %k0
; AVX512F-32-NEXT: kxorq %k4, %k0, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $58, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k7, %k4, %k7
+; AVX512F-32-NEXT: kxorq %k4, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $6, %k7, %k4
; AVX512F-32-NEXT: kxorq %k6, %k4, %k6
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: shrb %bl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $57, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
; AVX512F-32-NEXT: kshiftrq $7, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %ebx, %k5
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $56, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k7
; AVX512F-32-NEXT: kshiftrq $8, %k7, %k6
; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kmovd %edx, %k6
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $55, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k7, %k1, %k7
+; AVX512F-32-NEXT: kxorq %k1, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $9, %k7, %k1
; AVX512F-32-NEXT: kxorq %k2, %k1, %k2
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $54, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
+; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $10, %k7, %k2
; AVX512F-32-NEXT: kxorq %k3, %k2, %k3
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrl $12, %edx
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $53, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k7, %k3, %k3
+; AVX512F-32-NEXT: kxorq %k3, %k7, %k3
; AVX512F-32-NEXT: kshiftrq $11, %k3, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $52, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
+; AVX512F-32-NEXT: kxorq %k0, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $12, %k3, %k0
; AVX512F-32-NEXT: kmovd %edx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: shrl $14, %edi
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $51, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k3, %k7, %k3
+; AVX512F-32-NEXT: kxorq %k7, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $13, %k3, %k7
; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $50, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $14, %k3, %k4
; AVX512F-32-NEXT: kmovd %edi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $49, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $15, %k3, %k4
; AVX512F-32-NEXT: kmovd %esi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $48, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $16, %k3, %k4
; AVX512F-32-NEXT: kmovd %eax, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: shrb $7, %al
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $47, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $17, %k3, %k4
; AVX512F-32-NEXT: kxorq %k5, %k4, %k4
; AVX512F-32-NEXT: kmovd %eax, %k5
; AVX512F-32-NEXT: movl %edx, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $46, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k4
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k4
; AVX512F-32-NEXT: kshiftrq $18, %k4, %k3
; AVX512F-32-NEXT: kxorq %k6, %k3, %k6
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb %al
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $45, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k4, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k4, %k6
; AVX512F-32-NEXT: kshiftrq $19, %k6, %k4
; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
; AVX512F-32-NEXT: kmovd %eax, %k4
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $44, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k6, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kshiftrq $20, %k1, %k6
; AVX512F-32-NEXT: kxorq %k2, %k6, %k6
; AVX512F-32-NEXT: kmovd %edx, %k2
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $43, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k6
; AVX512F-32-NEXT: kshiftrq $21, %k6, %k1
; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $42, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k6, %k0, %k6
+; AVX512F-32-NEXT: kxorq %k0, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $22, %k6, %k0
; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: shrb %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $41, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $23, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k5
; AVX512F-32-NEXT: shrb $2, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $40, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k7
; AVX512F-32-NEXT: kshiftrq $24, %k7, %k6
; AVX512F-32-NEXT: kxorq %k3, %k6, %k3
; AVX512F-32-NEXT: kmovd %eax, %k6
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $39, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k7, %k3, %k7
+; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $25, %k7, %k3
; AVX512F-32-NEXT: kxorq %k4, %k3, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k3
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $38, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
+; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
; AVX512F-32-NEXT: kshiftrq $26, %k4, %k7
; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrl $28, %edx
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $37, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
+; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $27, %k4, %k7
; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $36, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
; AVX512F-32-NEXT: kshiftrq $28, %k1, %k4
; AVX512F-32-NEXT: kmovd %edx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k7
; AVX512F-32-NEXT: shrl $30, %esi
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $35, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
+; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $29, %k1, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $34, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kshiftrq $30, %k0, %k1
; AVX512F-32-NEXT: kmovd %esi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $33, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $31, %k0, %k1
; AVX512F-32-NEXT: kmovd %ecx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $32, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $32, %k0, %k1
; AVX512F-32-NEXT: kmovd %ebx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: shrb $7, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $31, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $33, %k0, %k1
; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $30, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $34, %k0, %k1
; AVX512F-32-NEXT: kxorq %k6, %k1, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k6
; AVX512F-32-NEXT: shrb %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $29, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k0, %k5, %k5
+; AVX512F-32-NEXT: kxorq %k5, %k0, %k5
; AVX512F-32-NEXT: kshiftrq $35, %k5, %k0
; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: shrb $2, %al
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $28, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k5, %k3, %k5
+; AVX512F-32-NEXT: kxorq %k3, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $36, %k5, %k3
; AVX512F-32-NEXT: kxorq %k2, %k3, %k2
; AVX512F-32-NEXT: kmovd %eax, %k3
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $27, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k5, %k2, %k2
+; AVX512F-32-NEXT: kxorq %k2, %k5, %k2
; AVX512F-32-NEXT: kshiftrq $37, %k2, %k5
; AVX512F-32-NEXT: kxorq %k4, %k5, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $26, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k2, %k5, %k2
+; AVX512F-32-NEXT: kxorq %k5, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $38, %k2, %k5
; AVX512F-32-NEXT: kxorq %k7, %k5, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k5
; AVX512F-32-NEXT: shrb %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $25, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
; AVX512F-32-NEXT: kshiftrq $39, %k7, %k2
; AVX512F-32-NEXT: kxorq %k6, %k2, %k6
; AVX512F-32-NEXT: kmovd %edx, %k2
; AVX512F-32-NEXT: shrb $2, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $24, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
; AVX512F-32-NEXT: kshiftrq $40, %k6, %k7
; AVX512F-32-NEXT: kxorq %k1, %k7, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrl $12, %ecx
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $23, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $41, %k6, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrl $14, %edi
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $22, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k6, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k6, %k0
; AVX512F-32-NEXT: kshiftrq $42, %k0, %k6
; AVX512F-32-NEXT: kxorq %k3, %k6, %k3
; AVX512F-32-NEXT: kmovd %edi, %k7
; AVX512F-32-NEXT: shrl $15, %esi
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $21, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k0, %k3, %k0
+; AVX512F-32-NEXT: kxorq %k3, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $43, %k0, %k3
; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kmovd %esi, %k6
; AVX512F-32-NEXT: shrb $3, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $20, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k0, %k3, %k3
+; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
; AVX512F-32-NEXT: kshiftrq $44, %k3, %k0
; AVX512F-32-NEXT: kxorq %k1, %k0, %k1
; AVX512F-32-NEXT: kmovd %edx, %k0
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $19, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k3, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k3, %k1
; AVX512F-32-NEXT: kshiftrq $45, %k1, %k3
; AVX512F-32-NEXT: kxorq %k5, %k3, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k3
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $18, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
+; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $46, %k1, %k4
; AVX512F-32-NEXT: kxorq %k7, %k4, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: shrb $6, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $17, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k1, %k5, %k1
+; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $47, %k1, %k5
; AVX512F-32-NEXT: kxorq %k6, %k5, %k5
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $16, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k1, %k5, %k1
+; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $48, %k1, %k5
; AVX512F-32-NEXT: kmovd %eax, %k6
; AVX512F-32-NEXT: kxorq %k6, %k5, %k6
; AVX512F-32-NEXT: shrb $7, %al
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $15, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $49, %k1, %k6
; AVX512F-32-NEXT: kxorq %k2, %k6, %k6
; AVX512F-32-NEXT: kmovd %eax, %k2
; AVX512F-32-NEXT: movl %edx, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $14, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k6
; AVX512F-32-NEXT: kshiftrq $50, %k6, %k1
; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k7 # 8-byte Reload
; AVX512F-32-NEXT: kxorq %k7, %k1, %k7
; AVX512F-32-NEXT: shrb %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $13, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $51, %k6, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k0
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $12, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $52, %k6, %k7
; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb $3, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $11, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $53, %k6, %k7
; AVX512F-32-NEXT: kxorq %k4, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k4
; AVX512F-32-NEXT: andb $1, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $10, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $54, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k5
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $9, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $55, %k6, %k7
; AVX512F-32-NEXT: kxorq %k2, %k7, %k2
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $8, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k6, %k2, %k2
+; AVX512F-32-NEXT: kxorq %k2, %k6, %k2
; AVX512F-32-NEXT: kshiftrq $56, %k2, %k6
; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $7, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k2, %k1
; AVX512F-32-NEXT: kshiftrq $57, %k1, %k2
; AVX512F-32-NEXT: kxorq %k0, %k2, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $6, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kshiftrq $58, %k0, %k1
; AVX512F-32-NEXT: kxorq %k3, %k1, %k1
; AVX512F-32-NEXT: movl %ebx, %eax
; AVX512F-32-NEXT: shrl $28, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $5, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $59, %k0, %k1
; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $4, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $60, %k0, %k1
; AVX512F-32-NEXT: kmovd %eax, %k2
; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
; AVX512F-32-NEXT: shrl $30, %ecx
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $3, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $61, %k0, %k1
; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $2, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $62, %k0, %k1
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $1, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftlq $1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $1, %k0, %k0
; AVX512F-32-NEXT: kmovd %eax, %k1
; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $62, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k5, %k1, %k7
+; AVX512F-32-NEXT: kxorq %k1, %k5, %k7
; AVX512F-32-NEXT: kshiftrq $2, %k7, %k1
; AVX512F-32-NEXT: kxorq %k2, %k1, %k2
; AVX512F-32-NEXT: kmovd %ecx, %k5
; AVX512F-32-NEXT: shrb %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $61, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
+; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $3, %k7, %k2
; AVX512F-32-NEXT: kxorq %k0, %k2, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $60, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k7, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftrq $4, %k0, %k7
; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $59, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k0, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: kshiftrq $5, %k7, %k0
; AVX512F-32-NEXT: kxorq %k4, %k0, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $58, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k7, %k4, %k7
+; AVX512F-32-NEXT: kxorq %k4, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $6, %k7, %k4
; AVX512F-32-NEXT: kxorq %k6, %k4, %k6
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: shrb %bl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $57, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
; AVX512F-32-NEXT: kshiftrq $7, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %ebx, %k5
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $56, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k7
; AVX512F-32-NEXT: kshiftrq $8, %k7, %k6
; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kmovd %edx, %k6
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $55, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k7, %k1, %k7
+; AVX512F-32-NEXT: kxorq %k1, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $9, %k7, %k1
; AVX512F-32-NEXT: kxorq %k2, %k1, %k2
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $54, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
+; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $10, %k7, %k2
; AVX512F-32-NEXT: kxorq %k3, %k2, %k3
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrl $12, %edx
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $53, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k7, %k3, %k3
+; AVX512F-32-NEXT: kxorq %k3, %k7, %k3
; AVX512F-32-NEXT: kshiftrq $11, %k3, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $52, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
+; AVX512F-32-NEXT: kxorq %k0, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $12, %k3, %k0
; AVX512F-32-NEXT: kmovd %edx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: shrl $14, %edi
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $51, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k3, %k7, %k3
+; AVX512F-32-NEXT: kxorq %k7, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $13, %k3, %k7
; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $50, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $14, %k3, %k4
; AVX512F-32-NEXT: kmovd %edi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $49, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $15, %k3, %k4
; AVX512F-32-NEXT: kmovd %esi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $48, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $16, %k3, %k4
; AVX512F-32-NEXT: kmovd %eax, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: shrb $7, %al
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $47, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k3
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $17, %k3, %k4
; AVX512F-32-NEXT: kxorq %k5, %k4, %k4
; AVX512F-32-NEXT: kmovd %eax, %k5
; AVX512F-32-NEXT: movl %edx, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $46, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k3, %k4, %k4
+; AVX512F-32-NEXT: kxorq %k4, %k3, %k4
; AVX512F-32-NEXT: kshiftrq $18, %k4, %k3
; AVX512F-32-NEXT: kxorq %k6, %k3, %k6
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb %al
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $45, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k4, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k4, %k6
; AVX512F-32-NEXT: kshiftrq $19, %k6, %k4
; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
; AVX512F-32-NEXT: kmovd %eax, %k4
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $44, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k6, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kshiftrq $20, %k1, %k6
; AVX512F-32-NEXT: kxorq %k2, %k6, %k6
; AVX512F-32-NEXT: kmovd %edx, %k2
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $43, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k6
; AVX512F-32-NEXT: kshiftrq $21, %k6, %k1
; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $42, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k6, %k0, %k6
+; AVX512F-32-NEXT: kxorq %k0, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $22, %k6, %k0
; AVX512F-32-NEXT: kxorq %k7, %k0, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: shrb %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $41, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $23, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k5
; AVX512F-32-NEXT: shrb $2, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $40, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k7
; AVX512F-32-NEXT: kshiftrq $24, %k7, %k6
; AVX512F-32-NEXT: kxorq %k3, %k6, %k3
; AVX512F-32-NEXT: kmovd %eax, %k6
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $39, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k7, %k3, %k7
+; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $25, %k7, %k3
; AVX512F-32-NEXT: kxorq %k4, %k3, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k3
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $38, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
+; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
; AVX512F-32-NEXT: kshiftrq $26, %k4, %k7
; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: shrl $28, %edx
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $37, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k4, %k7, %k4
+; AVX512F-32-NEXT: kxorq %k7, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $27, %k4, %k7
; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $36, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
; AVX512F-32-NEXT: kshiftrq $28, %k1, %k4
; AVX512F-32-NEXT: kmovd %edx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k4, %k7
; AVX512F-32-NEXT: shrl $30, %esi
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $35, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k1, %k7, %k1
+; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $29, %k1, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $34, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kshiftrq $30, %k0, %k1
; AVX512F-32-NEXT: kmovd %esi, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $33, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $31, %k0, %k1
; AVX512F-32-NEXT: kmovd %ecx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $32, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $32, %k0, %k1
; AVX512F-32-NEXT: kmovd %ebx, %k7
; AVX512F-32-NEXT: kxorq %k7, %k1, %k1
; AVX512F-32-NEXT: shrb $7, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $31, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $33, %k0, %k1
; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $30, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $34, %k0, %k1
; AVX512F-32-NEXT: kxorq %k6, %k1, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k6
; AVX512F-32-NEXT: shrb %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $29, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k0, %k5, %k5
+; AVX512F-32-NEXT: kxorq %k5, %k0, %k5
; AVX512F-32-NEXT: kshiftrq $35, %k5, %k0
; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
; AVX512F-32-NEXT: kmovd %ecx, %k0
; AVX512F-32-NEXT: shrb $2, %al
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $28, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k5, %k3, %k5
+; AVX512F-32-NEXT: kxorq %k3, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $36, %k5, %k3
; AVX512F-32-NEXT: kxorq %k2, %k3, %k2
; AVX512F-32-NEXT: kmovd %eax, %k3
; AVX512F-32-NEXT: shrb $3, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $27, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k5, %k2, %k2
+; AVX512F-32-NEXT: kxorq %k2, %k5, %k2
; AVX512F-32-NEXT: kshiftrq $37, %k2, %k5
; AVX512F-32-NEXT: kxorq %k4, %k5, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $26, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k2, %k5, %k2
+; AVX512F-32-NEXT: kxorq %k5, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $38, %k2, %k5
; AVX512F-32-NEXT: kxorq %k7, %k5, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k5
; AVX512F-32-NEXT: shrb %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $25, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k2, %k7, %k7
+; AVX512F-32-NEXT: kxorq %k7, %k2, %k7
; AVX512F-32-NEXT: kshiftrq $39, %k7, %k2
; AVX512F-32-NEXT: kxorq %k6, %k2, %k6
; AVX512F-32-NEXT: kmovd %edx, %k2
; AVX512F-32-NEXT: shrb $2, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $24, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
; AVX512F-32-NEXT: kshiftrq $40, %k6, %k7
; AVX512F-32-NEXT: kxorq %k1, %k7, %k7
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrl $12, %ecx
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $23, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $41, %k6, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k0
; AVX512F-32-NEXT: kmovd %ecx, %k1
; AVX512F-32-NEXT: shrl $14, %edi
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $22, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k6, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k6, %k0
; AVX512F-32-NEXT: kshiftrq $42, %k0, %k6
; AVX512F-32-NEXT: kxorq %k3, %k6, %k3
; AVX512F-32-NEXT: kmovd %edi, %k7
; AVX512F-32-NEXT: shrl $15, %esi
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $21, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k0, %k3, %k0
+; AVX512F-32-NEXT: kxorq %k3, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $43, %k0, %k3
; AVX512F-32-NEXT: kxorq %k4, %k3, %k3
; AVX512F-32-NEXT: kmovd %esi, %k6
; AVX512F-32-NEXT: shrb $3, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k3, %k3
; AVX512F-32-NEXT: kshiftrq $20, %k3, %k3
-; AVX512F-32-NEXT: kxorq %k0, %k3, %k3
+; AVX512F-32-NEXT: kxorq %k3, %k0, %k3
; AVX512F-32-NEXT: kshiftrq $44, %k3, %k0
; AVX512F-32-NEXT: kxorq %k1, %k0, %k1
; AVX512F-32-NEXT: kmovd %edx, %k0
; AVX512F-32-NEXT: shrb $4, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $19, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k3, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k3, %k1
; AVX512F-32-NEXT: kshiftrq $45, %k1, %k3
; AVX512F-32-NEXT: kxorq %k5, %k3, %k4
; AVX512F-32-NEXT: kmovd %ecx, %k3
; AVX512F-32-NEXT: andb $1, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k4, %k4
; AVX512F-32-NEXT: kshiftrq $18, %k4, %k4
-; AVX512F-32-NEXT: kxorq %k1, %k4, %k1
+; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $46, %k1, %k4
; AVX512F-32-NEXT: kxorq %k7, %k4, %k5
; AVX512F-32-NEXT: kmovd %ecx, %k4
; AVX512F-32-NEXT: shrb $6, %cl
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $17, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k1, %k5, %k1
+; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $47, %k1, %k5
; AVX512F-32-NEXT: kxorq %k6, %k5, %k5
; AVX512F-32-NEXT: kshiftlq $63, %k5, %k5
; AVX512F-32-NEXT: kshiftrq $16, %k5, %k5
-; AVX512F-32-NEXT: kxorq %k1, %k5, %k1
+; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $48, %k1, %k5
; AVX512F-32-NEXT: kmovd %eax, %k6
; AVX512F-32-NEXT: kxorq %k6, %k5, %k6
; AVX512F-32-NEXT: shrb $7, %al
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $15, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $49, %k1, %k6
; AVX512F-32-NEXT: kxorq %k2, %k6, %k6
; AVX512F-32-NEXT: kmovd %eax, %k2
; AVX512F-32-NEXT: movl %edx, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $14, %k6, %k6
-; AVX512F-32-NEXT: kxorq %k1, %k6, %k6
+; AVX512F-32-NEXT: kxorq %k6, %k1, %k6
; AVX512F-32-NEXT: kshiftrq $50, %k6, %k1
; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k7 # 8-byte Reload
; AVX512F-32-NEXT: kxorq %k7, %k1, %k7
; AVX512F-32-NEXT: shrb %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $13, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $51, %k6, %k7
; AVX512F-32-NEXT: kxorq %k0, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k0
; AVX512F-32-NEXT: shrb $2, %dl
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $12, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $52, %k6, %k7
; AVX512F-32-NEXT: kxorq %k3, %k7, %k7
; AVX512F-32-NEXT: kmovd %edx, %k3
; AVX512F-32-NEXT: shrb $3, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $11, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $53, %k6, %k7
; AVX512F-32-NEXT: kxorq %k4, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k4
; AVX512F-32-NEXT: andb $1, %al
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $10, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $54, %k6, %k7
; AVX512F-32-NEXT: kxorq %k5, %k7, %k7
; AVX512F-32-NEXT: kmovd %eax, %k5
; AVX512F-32-NEXT: kshiftlq $63, %k7, %k7
; AVX512F-32-NEXT: kshiftrq $9, %k7, %k7
-; AVX512F-32-NEXT: kxorq %k6, %k7, %k6
+; AVX512F-32-NEXT: kxorq %k7, %k6, %k6
; AVX512F-32-NEXT: kshiftrq $55, %k6, %k7
; AVX512F-32-NEXT: kxorq %k2, %k7, %k2
; AVX512F-32-NEXT: kshiftlq $63, %k2, %k2
; AVX512F-32-NEXT: kshiftrq $8, %k2, %k2
-; AVX512F-32-NEXT: kxorq %k6, %k2, %k2
+; AVX512F-32-NEXT: kxorq %k2, %k6, %k2
; AVX512F-32-NEXT: kshiftrq $56, %k2, %k6
; AVX512F-32-NEXT: kxorq %k1, %k6, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $7, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
+; AVX512F-32-NEXT: kxorq %k1, %k2, %k1
; AVX512F-32-NEXT: kshiftrq $57, %k1, %k2
; AVX512F-32-NEXT: kxorq %k0, %k2, %k0
; AVX512F-32-NEXT: kshiftlq $63, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $6, %k0, %k0
-; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
+; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
; AVX512F-32-NEXT: kshiftrq $58, %k0, %k1
; AVX512F-32-NEXT: kxorq %k3, %k1, %k1
; AVX512F-32-NEXT: movl %ebx, %eax
; AVX512F-32-NEXT: shrl $28, %eax
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $5, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $59, %k0, %k1
; AVX512F-32-NEXT: kxorq %k4, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $4, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $60, %k0, %k1
; AVX512F-32-NEXT: kmovd %eax, %k2
; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
; AVX512F-32-NEXT: shrl $30, %ecx
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $3, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $61, %k0, %k1
; AVX512F-32-NEXT: kxorq %k5, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $2, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $62, %k0, %k1
; AVX512F-32-NEXT: kmovd %ecx, %k2
; AVX512F-32-NEXT: kxorq %k2, %k1, %k1
; AVX512F-32-NEXT: kshiftlq $63, %k1, %k1
; AVX512F-32-NEXT: kshiftrq $1, %k1, %k1
-; AVX512F-32-NEXT: kxorq %k0, %k1, %k0
+; AVX512F-32-NEXT: kxorq %k1, %k0, %k0
; AVX512F-32-NEXT: kshiftlq $1, %k0, %k0
; AVX512F-32-NEXT: kshiftrq $1, %k0, %k0
; AVX512F-32-NEXT: kmovd %eax, %k1