mirror of git://gcc.gnu.org/git/gcc.git
				
				
				
			
		
			
				
	
	
		
			131 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			131 lines
		
	
	
		
			3.0 KiB
		
	
	
	
		
			C
		
	
	
	
| // { dg-do run }
 | |
| // { dg-additional-options "-msse2" { target sse2_runtime } }
 | |
| // { dg-additional-options "-mavx" { target avx_runtime } }
 | |
| 
 | |
| extern "C" void abort ();
 | |
| int a[1024] __attribute__((aligned (32))) = { 1 };
 | |
| int b[1024] __attribute__((aligned (32))) = { 1 };
 | |
| unsigned char c[1024] __attribute__((aligned (32))) = { 1 };
 | |
| int k, m;
 | |
| __UINTPTR_TYPE__ u, u2, u3;
 | |
| 
 | |
| __attribute__((noinline, noclone)) int
 | |
| foo (int *p)
 | |
| {
 | |
|   int i, s = 0, s2 = 0, t, t2;
 | |
|   #pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s) \
 | |
| 		   lastprivate (t2)
 | |
|   for (i = 0; i < 512; i++)
 | |
|     {
 | |
|       a[i] *= p[i];
 | |
|       t2 = k + p[i];
 | |
|       k += m + 1;
 | |
|       s += p[i] + k;
 | |
|       c[i]++;
 | |
|     }
 | |
|   #pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s2) \
 | |
| 		   lastprivate (t, u, u2, u3)
 | |
|   for (i = 512; i < 1024; i++)
 | |
|     {
 | |
|       a[i] *= p[i];
 | |
|       k += m + 1;
 | |
|       t = k + p[i];
 | |
|       u = (__UINTPTR_TYPE__) &k;
 | |
|       u2 = (__UINTPTR_TYPE__) &s2;
 | |
|       u3 = (__UINTPTR_TYPE__) &t;
 | |
|       s2 += t;
 | |
|       c[i]++;
 | |
|     }
 | |
|   return s + s2 + t + t2;
 | |
| }
 | |
| 
 | |
| __attribute__((noinline, noclone)) long int
 | |
| bar (int *p, long int n, long int o)
 | |
| {
 | |
|   long int i, s = 0, s2 = 0, t, t2;
 | |
|   #pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s) \
 | |
| 		   lastprivate (t2)
 | |
|   for (i = 0; i < n; i++)
 | |
|     {
 | |
|       a[i] *= p[i];
 | |
|       t2 = k + p[i];
 | |
|       k += m + 1;
 | |
|       s += p[i] + k;
 | |
|       c[i]++;
 | |
|     }
 | |
|   #pragma omp simd aligned(a, b, p : 32) linear(k: m + 1) reduction(+:s2) \
 | |
| 		   lastprivate (t, u, u2, u3)
 | |
|   for (i = n; i < o; i++)
 | |
|     {
 | |
|       a[i] *= p[i];
 | |
|       k += m + 1;
 | |
|       t = k + p[i];
 | |
|       u = (__UINTPTR_TYPE__) &k;
 | |
|       u2 = (__UINTPTR_TYPE__) &s2;
 | |
|       u3 = (__UINTPTR_TYPE__) &t;
 | |
|       s2 += t;
 | |
|       c[i]++;
 | |
|     }
 | |
|   return s + s2 + t + t2;
 | |
| }
 | |
| 
 | |
| int
 | |
| main ()
 | |
| {
 | |
| #if __SIZEOF_INT__ >= 4
 | |
|   int i;
 | |
|   k = 4;
 | |
|   m = 2;
 | |
|   for (i = 0; i < 1024; i++)
 | |
|     {
 | |
|       a[i] = i - 512;
 | |
|       b[i] = (i - 51) % 39;
 | |
|       c[i] = (unsigned char) i;
 | |
|     }
 | |
|   int s = foo (b);
 | |
|   for (i = 0; i < 1024; i++)
 | |
|     {
 | |
|       if (b[i] != (i - 51) % 39
 | |
| 	  || a[i] != (i - 512) * b[i]
 | |
| 	  || c[i] != (unsigned char) (i + 1))
 | |
| 	abort ();
 | |
|       a[i] = i - 512;
 | |
|     }
 | |
|   if (k != 4 + 3 * 1024
 | |
|       || s != 1596127 + (4 + 3 * 511 + b[511]) + (4 + 3 * 1024 + b[1023]))
 | |
|     abort ();
 | |
|   k = 4;
 | |
|   s = bar (b, 512, 1024);
 | |
|   for (i = 0; i < 1024; i++)
 | |
|     {
 | |
|       if (b[i] != (i - 51) % 39
 | |
| 	  || a[i] != (i - 512) * b[i]
 | |
| 	  || c[i] != (unsigned char) (i + 2))
 | |
| 	abort ();
 | |
|       a[i] = i - 512;
 | |
|     }
 | |
|   if (k != 4 + 3 * 1024
 | |
|       || s != 1596127 + (4 + 3 * 511 + b[511]) + (4 + 3 * 1024 + b[1023]))
 | |
|     abort ();
 | |
|   k = 4;
 | |
|   s = bar (b, 511, 1021);
 | |
|   for (i = 0; i < 1021; i++)
 | |
|     {
 | |
|       if (b[i] != (i - 51) % 39
 | |
| 	  || a[i] != (i - 512) * b[i]
 | |
| 	  || c[i] != (unsigned char) (i + 3))
 | |
| 	abort ();
 | |
|       a[i] = i - 512;
 | |
|     }
 | |
|   for (i = 1021; i < 1024; i++)
 | |
|     if (b[i] != (i - 51) % 39
 | |
| 	|| a[i] != i - 512
 | |
| 	|| c[i] != (unsigned char) (i + 2))
 | |
|       abort ();
 | |
|   if (k != 4 + 3 * 1021
 | |
|       || s != 1586803 + (4 + 3 * 510 + b[510]) + (4 + 3 * 1021 + b[1020]))
 | |
|     abort ();
 | |
| #endif
 | |
|   return 0;
 | |
| }
 |