Lines Matching refs:x4
66 #define roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, t0, t1, t2, t3, t4, t5, t6, \ argument
86 vpshufb t4, x4, x4; \
101 filter_8bit(x4, t5, t6, t7, t4); \
121 vextracti128 $1, x4, t2##_x; \
133 vaesenclast t4##_x, x4##_x, x4##_x; \
135 vinserti128 $1, t2##_x, x4, x4; \
155 filter_8bit(x4, t4, t5, t7, t2); \
167 vpxor x4, x3, x3; \
175 vpxor x2, x4, x4; \
185 vpxor x4, x1, x1; \
189 vpxor x3, x4, x4; \
212 vpxor t3, x4, x4; \
213 vpxor 0 * 32(mem_cd), x4, x4; \
250 #define two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
259 vmovdqu x4, 0 * 32(mem_cd); \
267 store_ab(x0, x1, x2, x3, x4, x5, x6, x7, mem_ab);
269 #define dummy_store(x0, x1, x2, x3, x4, x5, x6, x7, mem_ab) /* do nothing */ argument
271 #define store_ab_state(x0, x1, x2, x3, x4, x5, x6, x7, mem_ab) \ argument
273 vmovdqu x4, 4 * 32(mem_ab); \
282 #define enc_rounds32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
284 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
286 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
288 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
291 #define dec_rounds32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
293 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
295 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
297 two_roundsm32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \
520 #define inpack32_pre(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
536 vpxor 11 * 32(rio), x0, x4; \
543 #define inpack32_post(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
545 byteslice_16x16b_fast(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, \
552 vmovdqu x4, 4 * 32(mem_ab); \
566 #define outunpack32(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, \ argument
568 byteslice_16x16b_fast(y0, y4, x0, x4, y1, y5, x1, x5, y2, y6, x2, x6, \
587 vpxor x0, x4, x4; \
593 #define write_output(x0, x1, x2, x3, x4, x5, x6, x7, y0, y1, y2, y3, y4, y5, \ argument
599 vmovdqu x4, 4 * 32(rio); \