| /* { dg-do compile } */ |
| /* { dg-require-effective-target vect_shift } */ |
| /* { dg-require-effective-target vect_int } */ |
| |
| typedef unsigned int uint32_t; /* Declared locally; no #include is visible in this file.  NOTE(review): assumes unsigned int is 32 bits on the tested targets -- confirm.  */ |
| typedef short unsigned int uint16_t; /* Used in foo's return expression to keep only the low part of the sum.  */ |
| |
| /* Test kernel.  For each column i in 0..3, the elements of rows 0-3 are |
|    shifted right by the constants 10, 11, 12 and 13 respectively, each |
|    shifted value is combined with a second constant (times 20, AND 53, |
|    times 7, XOR 43), and the four terms are added into SUM.  The return |
|    value adds the uint16_t truncation of SUM to SUM shifted right by 16 |
|    as an unsigned value, then shifts that total right by one. |
|    NOTE(review): the constant shift counts look like what the |
|    vectorizable_shift scan at the end of this file targets -- confirm.  */ int foo (uint32_t arr[4][4]) |
| { |
| int sum = 0; /* Signed accumulator for the unsigned per-column terms.  */ |
| for(int i = 0; i < 4; i++) /* One iteration per column of ARR.  */ |
| { |
| sum += ((arr[0][i] >> 10) * 20) + ((arr[1][i] >> 11) & 53) /* Rows 0 and 1.  */ |
| + ((arr[2][i] >> 12) * 7) + ((arr[3][i] >> 13) ^ 43); /* Rows 2 and 3.  */ |
| } |
| return (((uint16_t)sum) + ((uint32_t)sum >> 16)) >> 1; /* SUM is cast to uint32_t before >> 16 so the shift acts on an unsigned value.  */ |
| } |
| |
| /* For a target that has a vector/scalar shift/rotate optab, check |
| that we are not adding the cost of creating a vector from the scalar |
| in the prologue. */ |
| /* { dg-final { scan-tree-dump {vectorizable_shift ===[\n\r][^\n]*prologue_cost = 0} "vect" { target { aarch64*-*-* x86_64-*-* } } } } */ |