Lines Matching +full:4 +full:b

18 .irp b, 0, 1, 2, 3, 24, 25, 26, 27, 28, 29, 30, 31
19 .set .Lv\b\().4s, \b
40 ext T0.16b, m1.16b, m1.16b, #8; \
45 eor T0.16b, T0.16b, T1.16b; \
46 ext T1.16b, RZERO.16b, T0.16b, #8; \
47 ext T0.16b, T0.16b, RZERO.16b, #8; \
48 eor r0.16b, r0.16b, T1.16b; \
49 eor r1.16b, r1.16b, T0.16b;
55 ext T0.16b, m1.16b, m1.16b, #8; \
56 ext T2.16b, m3.16b, m3.16b, #8; \
57 ext T4.16b, m5.16b, m5.16b, #8; \
58 ext T6.16b, m7.16b, m7.16b, #8; \
75 eor T0.16b, T0.16b, T1.16b; \
76 eor T2.16b, T2.16b, T3.16b; \
77 eor T4.16b, T4.16b, T5.16b; \
78 eor T6.16b, T6.16b, T7.16b; \
79 ext T1.16b, RZERO.16b, T0.16b, #8; \
80 ext T3.16b, RZERO.16b, T2.16b, #8; \
81 ext T5.16b, RZERO.16b, T4.16b, #8; \
82 ext T7.16b, RZERO.16b, T6.16b, #8; \
83 ext T0.16b, T0.16b, RZERO.16b, #8; \
84 ext T2.16b, T2.16b, RZERO.16b, #8; \
85 ext T4.16b, T4.16b, RZERO.16b, #8; \
86 ext T6.16b, T6.16b, RZERO.16b, #8; \
87 eor r0.16b, r0.16b, T1.16b; \
88 eor r2.16b, r2.16b, T3.16b; \
89 eor r4.16b, r4.16b, T5.16b; \
90 eor r6.16b, r6.16b, T7.16b; \
91 eor r1.16b, r1.16b, T0.16b; \
92 eor r3.16b, r3.16b, T2.16b; \
93 eor r5.16b, r5.16b, T4.16b; \
94 eor r7.16b, r7.16b, T6.16b;
102 ext T1.16b, T0.16b, RZERO.16b, #8; \
103 ext T0.16b, RZERO.16b, T0.16b, #8; \
104 eor r1.16b, r1.16b, T1.16b; \
105 eor r0.16b, r0.16b, T0.16b; \
107 eor a.16b, r0.16b, T0.16b;
110 rev32 b0.16b, b0.16b; \
111 ext T0.16b, m1.16b, m1.16b, #8; \
112 sm4e b0.4s, v24.4s; \
114 sm4e b0.4s, v25.4s; \
116 sm4e b0.4s, v26.4s; \
118 sm4e b0.4s, v27.4s; \
120 sm4e b0.4s, v28.4s; \
121 eor T0.16b, T0.16b, T1.16b; \
122 sm4e b0.4s, v29.4s; \
123 ext T1.16b, RZERO.16b, T0.16b, #8; \
124 sm4e b0.4s, v30.4s; \
125 ext T0.16b, T0.16b, RZERO.16b, #8; \
126 sm4e b0.4s, v31.4s; \
127 eor r0.16b, r0.16b, T1.16b; \
128 rev64 b0.4s, b0.4s; \
129 eor r1.16b, r1.16b, T0.16b; \
130 ext b0.16b, b0.16b, b0.16b, #8; \
131 rev32 b0.16b, b0.16b;
137 rev32 b0.16b, b0.16b; \
138 rev32 b1.16b, b1.16b; \
139 rev32 b2.16b, b2.16b; \
140 ext T0.16b, m1.16b, m1.16b, #8; \
141 ext T2.16b, m3.16b, m3.16b, #8; \
142 ext T4.16b, m5.16b, m5.16b, #8; \
143 sm4e b0.4s, v24.4s; \
144 sm4e b1.4s, v24.4s; \
145 sm4e b2.4s, v24.4s; \
149 sm4e b0.4s, v25.4s; \
150 sm4e b1.4s, v25.4s; \
151 sm4e b2.4s, v25.4s; \
155 sm4e b0.4s, v26.4s; \
156 sm4e b1.4s, v26.4s; \
157 sm4e b2.4s, v26.4s; \
161 sm4e b0.4s, v27.4s; \
162 sm4e b1.4s, v27.4s; \
163 sm4e b2.4s, v27.4s; \
167 sm4e b0.4s, v28.4s; \
168 sm4e b1.4s, v28.4s; \
169 sm4e b2.4s, v28.4s; \
170 eor T0.16b, T0.16b, T1.16b; \
171 eor T2.16b, T2.16b, T3.16b; \
172 eor T4.16b, T4.16b, T5.16b; \
173 sm4e b0.4s, v29.4s; \
174 sm4e b1.4s, v29.4s; \
175 sm4e b2.4s, v29.4s; \
176 ext T1.16b, RZERO.16b, T0.16b, #8; \
177 ext T3.16b, RZERO.16b, T2.16b, #8; \
178 ext T5.16b, RZERO.16b, T4.16b, #8; \
179 sm4e b0.4s, v30.4s; \
180 sm4e b1.4s, v30.4s; \
181 sm4e b2.4s, v30.4s; \
182 ext T0.16b, T0.16b, RZERO.16b, #8; \
183 ext T2.16b, T2.16b, RZERO.16b, #8; \
184 ext T4.16b, T4.16b, RZERO.16b, #8; \
185 sm4e b0.4s, v31.4s; \
186 sm4e b1.4s, v31.4s; \
187 sm4e b2.4s, v31.4s; \
188 eor r0.16b, r0.16b, T1.16b; \
189 eor r2.16b, r2.16b, T3.16b; \
190 eor r4.16b, r4.16b, T5.16b; \
191 rev64 b0.4s, b0.4s; \
192 rev64 b1.4s, b1.4s; \
193 rev64 b2.4s, b2.4s; \
194 eor r1.16b, r1.16b, T0.16b; \
195 eor r3.16b, r3.16b, T2.16b; \
196 eor r5.16b, r5.16b, T4.16b; \
197 ext b0.16b, b0.16b, b0.16b, #8; \
198 ext b1.16b, b1.16b, b1.16b, #8; \
199 ext b2.16b, b2.16b, b2.16b, #8; \
200 eor r0.16b, r0.16b, r2.16b; \
201 eor r1.16b, r1.16b, r3.16b; \
202 rev32 b0.16b, b0.16b; \
203 rev32 b1.16b, b1.16b; \
204 rev32 b2.16b, b2.16b; \
205 eor r0.16b, r0.16b, r4.16b; \
206 eor r1.16b, r1.16b, r5.16b;
213 rev64 vctr.16b, vctr.16b;
216 ld1 {vlen.16b}, [x7]; \
223 rbit vlen.16b, vlen.16b; \
224 rev64 vctr0.16b, vctr0.16b; \
226 eor RHASH.16b, RHASH.16b, vlen.16b; \
230 rbit RHASH.16b, RHASH.16b; \
231 eor RHASH.16b, RHASH.16b, vctr0.16b;
272 eor RZERO.16b, RZERO.16b, RZERO.16b
275 rev32 v0.16b, RZERO.16b
279 rbit RH1.16b, v0.16b
289 /* H ^ 4 */
293 st1 {RH1.16b-RH4.16b}, [x1]
306 ld1 {RH1.16b-RH4.16b}, [x0]
308 ld1 {RHASH.16b}, [x1]
309 rbit RHASH.16b, RHASH.16b
314 eor RZERO.16b, RZERO.16b, RZERO.16b
317 cmp w3, #4
320 sub w3, w3, #4
322 ld1 {v0.16b-v3.16b}, [x2], #64
324 rbit v0.16b, v0.16b
325 rbit v1.16b, v1.16b
326 rbit v2.16b, v2.16b
327 rbit v3.16b, v3.16b
330 * (in0 ^ HASH) * H^4 => rr0:rr1
335 eor RHASH.16b, RHASH.16b, v0.16b
342 eor RR0.16b, RR0.16b, RR2.16b
343 eor RR1.16b, RR1.16b, RR3.16b
344 eor RR0.16b, RR0.16b, RR4.16b
345 eor RR1.16b, RR1.16b, RR5.16b
346 eor RR0.16b, RR0.16b, RR6.16b
347 eor RR1.16b, RR1.16b, RR7.16b
352 b .Lghash_loop_4x
357 ld1 {v0.16b}, [x2], #16
358 rbit v0.16b, v0.16b
359 eor RHASH.16b, RHASH.16b, v0.16b
367 rbit RHASH.16b, RHASH.16b
391 ld1 {RH1.16b-RH4.16b}, [x6]
393 ld1 {RHASH.16b}, [x5]
394 rbit RHASH.16b, RHASH.16b
399 eor RZERO.16b, RZERO.16b, RZERO.16b
404 cmp w4, #(4 * 16)
407 sub w4, w4, #(4 * 16)
415 ld1 {RTMP0.16b-RTMP3.16b}, [x2], #64
419 eor v0.16b, v0.16b, RTMP0.16b
420 eor v1.16b, v1.16b, RTMP1.16b
421 eor v2.16b, v2.16b, RTMP2.16b
422 eor v3.16b, v3.16b, RTMP3.16b
423 st1 {v0.16b-v3.16b}, [x1], #64
427 rbit v0.16b, v0.16b
428 rbit v1.16b, v1.16b
429 rbit v2.16b, v2.16b
430 rbit v3.16b, v3.16b
433 * (in0 ^ HASH) * H^4 => rr0:rr1
438 eor RHASH.16b, RHASH.16b, v0.16b
445 eor RR0.16b, RR0.16b, RR2.16b
446 eor RR1.16b, RR1.16b, RR3.16b
447 eor RR0.16b, RR0.16b, RR4.16b
448 eor RR1.16b, RR1.16b, RR5.16b
449 eor RR0.16b, RR0.16b, RR6.16b
450 eor RR1.16b, RR1.16b, RR7.16b
455 b .Lgcm_enc_loop_4x
466 ld1 {RTMP0.16b}, [x2], #16
470 eor v0.16b, v0.16b, RTMP0.16b
471 st1 {v0.16b}, [x1], #16
474 rbit v0.16b, v0.16b
475 eor RHASH.16b, RHASH.16b, v0.16b
480 b .Lgcm_enc_loop_1x
491 ld1 {v3.16b}, [x0]
496 umov w6, v0.b[0] /* get top crypted byte */
501 ext v0.16b, v0.16b, v0.16b, #1
503 ins v0.b[15], w6
509 tbl v0.16b, {v0.16b}, v3.16b
512 rbit v0.16b, v0.16b
513 eor RHASH.16b, RHASH.16b, v0.16b
522 b .Lgcm_enc_ret
530 rbit RHASH.16b, RHASH.16b
602 ld1 {RH1.16b-RH3.16b}, [x6]
604 ld1 {RHASH.16b}, [x5]
605 rbit RHASH.16b, RHASH.16b
610 eor RZERO.16b, RZERO.16b, RZERO.16b
620 ld1 {v3.16b-v5.16b}, [x2], #(3 * 16)
624 rbit v6.16b, v3.16b
626 rbit v7.16b, v4.16b
628 rbit v8.16b, v5.16b
630 eor RHASH.16b, RHASH.16b, v6.16b
638 eor v0.16b, v0.16b, v3.16b
639 eor v1.16b, v1.16b, v4.16b
640 eor v2.16b, v2.16b, v5.16b
644 st1 {v0.16b-v2.16b}, [x1], #(3 * 16)
647 b .Lgcm_dec_loop_3x
655 ld1 {v3.16b}, [x2], #16
659 rbit v6.16b, v3.16b
661 eor RHASH.16b, RHASH.16b, v6.16b
665 eor v0.16b, v0.16b, v3.16b
669 st1 {v0.16b}, [x1], #16
672 b .Lgcm_dec_loop_1x
683 ld1 {v3.16b}, [x0]
688 umov w6, v0.b[0] /* get top crypted byte */
693 ext v0.16b, v0.16b, v0.16b, #1
695 ins v0.b[15], w0
701 tbl v0.16b, {v0.16b}, v3.16b
704 rbit v0.16b, v0.16b
705 eor RHASH.16b, RHASH.16b, v0.16b
714 b .Lgcm_dec_ret
722 rbit RHASH.16b, RHASH.16b
732 .align 4