/* teams-2.c */

  1. /* { dg-do run } */
  2. #include <stdlib.h>
  /* Error tolerance applied by check ().  */
  #define EPS 0.0001
  /* Number of elements in each test vector.  The expansion is parenthesized
     so that N behaves as a single operand in any expression, e.g. x % N or
     x / N.  */
  #define N (1024 * 1024)
  /* Fill the first n elements of both vectors with deterministic test data:
     B[k] receives 0.1 * k and C[k] receives 0.01 * k * k.  Each value is
     computed in double precision and narrowed to float by the assignment.
     Nothing is written when n is zero or negative.  */
  void init (float B[], float C[], int n)
  {
    int k = 0;

    while (k < n)
      {
        B[k] = 0.1 * k;
        C[k] = 0.01 * k * k;
        ++k;
      }
  }
  /* Sequential reference implementation: return the dot product of the first
     n elements of B and C, accumulated into a float in index order.  The
     result is 0 when n is zero or negative.  */
  float dotprod_ref (float B[], float C[], int n)
  {
    float total = 0.0;
    const float *pb = B;
    const float *pc = C;
    int remaining;

    /* Walk both vectors front to back, one product per step.  */
    for (remaining = n; remaining > 0; remaining--)
      total += *pb++ * *pc++;

    return total;
  }
  /* Dot product of the first n elements of B and C, written with the OpenMP
     target / teams / distribute constructs.

     The index range [0, n) is cut into blocks of block_size elements.  The
     distribute loop iterates over the blocks and a parallel for loop sums
     the elements of each block; both levels combine their partial results
     through a reduction on sum.  When the pragmas are not honoured (built
     without OpenMP support) the two loops simply run sequentially.

     B, C           input vectors; elements [0, n) are read
     n              number of elements; n <= 0 yields 0
     block_size     elements per block; a value outside 1..n is replaced by
                    n (a single block), so a zero or negative stride can no
                    longer stall the outer loop
     num_teams      forwarded to the num_teams clause
     block_threads  forwarded to the thread_limit clause

     Returns the accumulated sum.  */
  float dotprod (float B[], float C[], int n, int block_size,
                 int num_teams, int block_threads)
  {
    float sum = 0;

    /* Nothing to add up, and a negative n would not be a valid array
       section length in the map clauses below.  */
    if (n <= 0)
      return sum;

    /* A non-positive stride would never advance i0; an oversized one means
       a single block anyway.  */
    if (block_size <= 0 || block_size > n)
      block_size = n;

  #pragma omp target map(to: B[0:n], C[0:n]) map(tofrom: sum)
  #pragma omp teams num_teams(num_teams) thread_limit(block_threads) \
    reduction(+:sum)
  #pragma omp distribute
    for (int i0 = 0; i0 < n; i0 += block_size)
      {
        /* i0 < n here, so n - i0 is positive and the comparison cannot
           overflow the way i0 + block_size > n could.  The last block is
           cut short at n.  */
        int end = (block_size < n - i0) ? i0 + block_size : n;

  #pragma omp parallel for reduction(+:sum)
        for (int i = i0; i < end; i++)
          sum += B[i] * C[i];
      }

    return sum;
  }
  37. void check (float a, float b)
  38. {
  39. float err = (b == 0.0) ? a : (a - b) / b;
  40. if (((err > 0) ? err : -err) > EPS)
  41. abort ();
  42. }
  43. int main ()
  44. {
  45. float *v1 = (float *) malloc (N * sizeof (float));
  46. float *v2 = (float *) malloc (N * sizeof (float));
  47. float p1, p2;
  48. init (v1, v2, N);
  49. p1 = dotprod_ref (v1, v2, N);
  50. p2 = dotprod (v1, v2, N, N / 8, 2, 8);
  51. check (p1, p2);
  52. free (v1);
  53. free (v2);
  54. return 0;
  55. }