forked from OSchip/llvm-project
114 lines
2.7 KiB
C
114 lines
2.7 KiB
C
// RUN: %libomp-compile-and-run
|
|
// RUN: %libomp-compile && env KMP_TASKLOOP_MIN_TASKS=1 %libomp-run
|
|
|
|
// These compilers don't support the taskloop construct
|
|
// UNSUPPORTED: gcc-4, gcc-5, icc-16
|
|
// GCC 6 has support for taskloops, but at least 6.3.0 is crashing on this test
|
|
// UNSUPPORTED: gcc-6
|
|
|
|
/*
|
|
* Test for taskloop
|
|
* Method: calculate how many times the iteration space is dispatched
|
|
* and judge if each dispatch has the requested grainsize
|
|
* It is possible for two adjacent chunks to be executed by the same thread
|
|
*/
|
|
#include <stdio.h>
|
|
#include <omp.h>
|
|
#include <stdlib.h>
|
|
#include "omp_testsuite.h"
|
|
|
|
#define CFDMAX_SIZE 1120
|
|
|
|
int test_omp_taskloop_grainsize()
|
|
{
|
|
int result = 0;
|
|
int i, grainsize, count, tmp_count, num_off;
|
|
int *tmp, *tids, *tidsArray;
|
|
|
|
tidsArray = (int *)malloc(sizeof(int) * CFDMAX_SIZE);
|
|
tids = tidsArray;
|
|
|
|
for (grainsize = 1; grainsize < 48; ++grainsize) {
|
|
fprintf(stderr, "Grainsize %d\n", grainsize);
|
|
count = tmp_count = num_off = 0;
|
|
|
|
for (i = 0; i < CFDMAX_SIZE; ++i) {
|
|
tids[i] = -1;
|
|
}
|
|
|
|
#pragma omp parallel shared(tids)
|
|
{
|
|
#pragma omp master
|
|
#pragma omp taskloop grainsize(grainsize)
|
|
for (i = 0; i < CFDMAX_SIZE; i++) {
|
|
tids[i] = omp_get_thread_num();
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < CFDMAX_SIZE; ++i) {
|
|
if (tids[i] == -1) {
|
|
fprintf(stderr, " Iteration %d not touched!\n", i);
|
|
result++;
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < CFDMAX_SIZE - 1; ++i) {
|
|
if (tids[i] != tids[i + 1]) {
|
|
count++;
|
|
}
|
|
}
|
|
|
|
tmp = (int *)malloc(sizeof(int) * (count + 1));
|
|
tmp[0] = 1;
|
|
|
|
for (i = 0; i < CFDMAX_SIZE - 1; ++i) {
|
|
if (tmp_count > count) {
|
|
printf("--------------------\nTestinternal Error: List too "
|
|
"small!!!\n--------------------\n");
|
|
break;
|
|
}
|
|
if (tids[i] != tids[i + 1]) {
|
|
tmp_count++;
|
|
tmp[tmp_count] = 1;
|
|
} else {
|
|
tmp[tmp_count]++;
|
|
}
|
|
}
|
|
|
|
// is grainsize statement working?
|
|
int num_tasks = CFDMAX_SIZE / grainsize;
|
|
int multiple1 = CFDMAX_SIZE / num_tasks;
|
|
int multiple2 = CFDMAX_SIZE / num_tasks + 1;
|
|
for (i = 0; i < count; i++) {
|
|
// it is possible for 2 adjacent chunks assigned to a same thread
|
|
if (tmp[i] % multiple1 != 0 && tmp[i] % multiple2 != 0) {
|
|
num_off++;
|
|
}
|
|
}
|
|
|
|
if (num_off > 1) {
|
|
fprintf(stderr, " The number of bad chunks is %d\n", num_off);
|
|
result++;
|
|
} else {
|
|
fprintf(stderr, " Everything ok\n");
|
|
}
|
|
|
|
free(tmp);
|
|
}
|
|
free(tidsArray);
|
|
return (result==0);
|
|
}
|
|
|
|
int main()
|
|
{
|
|
int i;
|
|
int num_failed=0;
|
|
|
|
for (i = 0; i < REPETITIONS; i++) {
|
|
if (!test_omp_taskloop_grainsize()) {
|
|
num_failed++;
|
|
}
|
|
}
|
|
return num_failed;
|
|
}
|