Lines Matching full:i
104 int i; \
106 for (i = 0; i < (128 / BITS); i++) { \
107 const int32_t a = (int##BITS##_t)s390_vec_read_element##BITS(v2, i); \
108 const int32_t b = (int##BITS##_t)s390_vec_read_element##BITS(v3, i); \
110 s390_vec_write_element##BITS(v1, i, (a + b + 1) >> 1); \
120 int i; \
122 for (i = 0; i < (128 / BITS); i++) { \
123 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
124 const uint##BITS##_t b = s390_vec_read_element##BITS(v3, i); \
126 s390_vec_write_element##BITS(v1, i, (a + b + 1) >> 1); \
135 int i; \
137 for (i = 0; i < (128 / BITS); i++) { \
138 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
140 s390_vec_write_element##BITS(v1, i, clz32(a) - 32 + BITS); \
149 int i; \
151 for (i = 0; i < (128 / BITS); i++) { \
152 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
154 s390_vec_write_element##BITS(v1, i, a ? ctz32(a) : BITS); \
266 int i; \
268 for (i = 0; i < (128 / BITS); i++) { \
269 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
270 const uint##BITS##_t b = s390_vec_read_element##BITS(v3, i); \
271 const uint##BITS##_t c = s390_vec_read_element##BITS(v4, i); \
273 s390_vec_write_element##BITS(v1, i, a * b + c); \
283 int i; \
285 for (i = 0; i < (128 / BITS); i++) { \
286 const int32_t a = (int##BITS##_t)s390_vec_read_element##BITS(v2, i); \
287 const int32_t b = (int##BITS##_t)s390_vec_read_element##BITS(v3, i); \
288 const int32_t c = (int##BITS##_t)s390_vec_read_element##BITS(v4, i); \
290 s390_vec_write_element##BITS(v1, i, (a * b + c) >> BITS); \
300 int i; \
302 for (i = 0; i < (128 / BITS); i++) { \
303 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
304 const uint##BITS##_t b = s390_vec_read_element##BITS(v3, i); \
305 const uint##BITS##_t c = s390_vec_read_element##BITS(v4, i); \
307 s390_vec_write_element##BITS(v1, i, (a * b + c) >> BITS); \
317 int i, j; \
319 for (i = 0, j = 0; i < (128 / TBITS); i++, j += 2) { \
322 int##TBITS##_t c = s390_vec_read_element##TBITS(v4, i); \
324 s390_vec_write_element##TBITS(v1, i, a * b + c); \
335 int i, j; \
337 for (i = 0, j = 0; i < (128 / TBITS); i++, j += 2) { \
340 uint##TBITS##_t c = s390_vec_read_element##TBITS(v4, i); \
342 s390_vec_write_element##TBITS(v1, i, a * b + c); \
353 int i, j; \
355 for (i = 0, j = 1; i < (128 / TBITS); i++, j += 2) { \
358 int##TBITS##_t c = s390_vec_read_element##TBITS(v4, i); \
360 s390_vec_write_element##TBITS(v1, i, a * b + c); \
371 int i, j; \
373 for (i = 0, j = 1; i < (128 / TBITS); i++, j += 2) { \
376 uint##TBITS##_t c = s390_vec_read_element##TBITS(v4, i); \
378 s390_vec_write_element##TBITS(v1, i, a * b + c); \
389 int i; \
391 for (i = 0; i < (128 / BITS); i++) { \
392 const int32_t a = (int##BITS##_t)s390_vec_read_element##BITS(v2, i); \
393 const int32_t b = (int##BITS##_t)s390_vec_read_element##BITS(v3, i); \
395 s390_vec_write_element##BITS(v1, i, (a * b) >> BITS); \
405 int i; \
407 for (i = 0; i < (128 / BITS); i++) { \
408 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
409 const uint##BITS##_t b = s390_vec_read_element##BITS(v3, i); \
411 s390_vec_write_element##BITS(v1, i, (a * b) >> BITS); \
421 int i, j; \
423 for (i = 0, j = 0; i < (128 / TBITS); i++, j += 2) { \
427 s390_vec_write_element##TBITS(v1, i, a * b); \
438 int i, j; \
440 for (i = 0, j = 0; i < (128 / TBITS); i++, j += 2) { \
444 s390_vec_write_element##TBITS(v1, i, a * b); \
455 int i, j; \
457 for (i = 0, j = 1; i < (128 / TBITS); i++, j += 2) { \
461 s390_vec_write_element##TBITS(v1, i, a * b); \
472 int i, j; \
474 for (i = 0, j = 1; i < (128 / TBITS); i++, j += 2) { \
478 s390_vec_write_element##TBITS(v1, i, a * b); \
488 int i; \
490 for (i = 0; i < (128 / BITS); i++) { \
491 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
493 s390_vec_write_element##BITS(v1, i, ctpop32(a)); \
504 int i; \
506 for (i = 0; i < (128 / BITS); i++) { \
507 const uint##BITS##_t a = s390_vec_read_element##BITS(v1, i); \
508 const uint##BITS##_t b = s390_vec_read_element##BITS(v2, i); \
509 const uint##BITS##_t mask = s390_vec_read_element##BITS(v3, i); \
512 s390_vec_write_element##BITS(v1, i, d); \
529 int i; in HELPER() local
531 for (i = 15; i >= 0; --i, e1 = e0) { in HELPER()
532 e0 = s390_vec_read_element8(v2, i); in HELPER()
533 sh = s390_vec_read_element8(v3, i) & 7; in HELPER()
535 s390_vec_write_element8(&tmp, i, rol32(e0 | (e1 << 24), sh)); in HELPER()
552 int i = 0; in HELPER() local
555 e0 = (int32_t)(int8_t)s390_vec_read_element8(v2, i); in HELPER()
556 sh = s390_vec_read_element8(v3, i) & 7; in HELPER()
557 s390_vec_write_element8(&tmp, i, e0 >> sh); in HELPER()
560 for (i = 1; i < 16; ++i, e1 = e0) { in HELPER()
561 e0 = s390_vec_read_element8(v2, i); in HELPER()
562 sh = s390_vec_read_element8(v3, i) & 7; in HELPER()
563 s390_vec_write_element8(&tmp, i, (e0 | e1 << 8) >> sh); in HELPER()
581 for (int i = 0; i < 16; ++i, e1 = e0) { in HELPER() local
582 e0 = s390_vec_read_element8(v2, i); in HELPER()
583 sh = s390_vec_read_element8(v3, i) & 7; in HELPER()
585 s390_vec_write_element8(&tmp, i, (e0 | (e1 << 8)) >> sh); in HELPER()
595 int i; \
597 for (i = 0; i < (128 / BITS); i++) { \
598 const uint##BITS##_t a = s390_vec_read_element##BITS(v2, i); \
599 const uint##BITS##_t b = s390_vec_read_element##BITS(v3, i); \
601 s390_vec_write_element##BITS(v1, i, a >= b); \