Lines Matching +full:0 +full:x32
48 // Multiply 32x32 => 64 and accumulate
49 vpshufd $0x10, T0, T4
50 vpshufd $0x32, T0, T0
51 vpshufd $0x10, T1, T5
52 vpshufd $0x32, T1, T1
53 vpshufd $0x10, T2, T6
54 vpshufd $0x32, T2, T2
55 vpshufd $0x10, T3, T7
56 vpshufd $0x32, T3, T3
71 * It's guaranteed that message_len % 16 == 0.
75 vmovdqu 0x00(KEY), K0
76 vmovdqu 0x10(KEY), K1
77 add $0x20, KEY
83 sub $0x40, MESSAGE_LEN
87 vmovdqu 0x00(KEY), K2
88 vmovdqu 0x10(KEY), K3
91 vmovdqu 0x20(MESSAGE), T3
92 vmovdqu 0x20(KEY), K0
93 vmovdqu 0x30(KEY), K1
96 add $0x40, MESSAGE
97 add $0x40, KEY
98 sub $0x40, MESSAGE_LEN
102 and $0x3f, MESSAGE_LEN
105 cmp $0x20, MESSAGE_LEN
110 vmovdqu 0x00(KEY), K2
111 vmovdqu 0x10(KEY), K3
113 add $0x20, MESSAGE
114 add $0x20, KEY
115 sub $0x20, MESSAGE_LEN
125 vmovdqu 0x00(KEY), K2_XMM
126 vmovdqu 0x10(KEY), K3_XMM
132 // PASS0_SUMS is (0A 0B 0C 0D)
137 // (0A + 0B + 0C + 0D,
143 vpunpcklqdq PASS1_SUMS, PASS0_SUMS, T0 // T0 = (0A 1A 0C 1C)
144 vpunpckhqdq PASS1_SUMS, PASS0_SUMS, T1 // T1 = (0B 1B 0D 1D)
148 vinserti128 $0x1, T2_XMM, T0, T4 // T4 = (0A 1A 2A 3A)
149 vinserti128 $0x1, T3_XMM, T1, T5 // T5 = (0B 1B 2B 3B)
150 vperm2i128 $0x31, T2, T0, T0 // T0 = (0C 1C 2C 3C)
151 vperm2i128 $0x31, T3, T1, T1 // T1 = (0D 1D 2D 3D)