diff options
Diffstat (limited to 'libgomp/testsuite/libgomp.c/declare-variant-1.c')
-rw-r--r-- | libgomp/testsuite/libgomp.c/declare-variant-1.c | 54 |
1 files changed, 54 insertions, 0 deletions
diff --git a/libgomp/testsuite/libgomp.c/declare-variant-1.c b/libgomp/testsuite/libgomp.c/declare-variant-1.c new file mode 100644 index 0000000..d16608f --- /dev/null +++ b/libgomp/testsuite/libgomp.c/declare-variant-1.c @@ -0,0 +1,54 @@ +/* { dg-do link { target vect_simd_clones } } */ +/* { dg-require-effective-target lto } */ +/* { dg-require-effective-target fpic } */ +/* { dg-require-effective-target shared } */ +/* { dg-additional-options "-fdump-tree-gimple -fdump-tree-optimized -O2 -fPIC -shared -flto -flto-partition=one" } */ +/* { dg-additional-options "-mno-sse3" { target { i?86-*-* x86_64-*-* } } } */ + +int +f01 (int a) +{ + asm volatile ("" : "+g" (a) : "g" (1) : "memory"); + return a; +} + +int +f02 (int a) +{ + asm volatile ("" : "+g" (a) : "g" (2) : "memory"); + return a; +} + +int +f03 (int a) +{ + asm volatile ("" : "+g" (a) : "g" (3) : "memory"); + return a; +} + +#pragma omp declare variant (f01) match (device={isa("avx512f")}) /* 4 or 8 */ +#pragma omp declare variant (f02) match (implementation={vendor(score(3):gnu)},device={kind(cpu)}) /* (1 or 2) + 3 */ +#pragma omp declare variant (f03) match (implementation={vendor(score(5):gnu)},device={kind(host)}) /* (1 or 2) + 5 */ +int +f04 (int a) +{ + asm volatile ("" : "+g" (a) : "g" (4) : "memory"); + return a; +} + +#pragma omp declare simd +int +test1 (int x) +{ + /* At gimplification time, we can't decide yet which function to call. */ + /* { dg-final { scan-tree-dump-times "f04 \\\(x" 2 "gimple" } } */ + /* After simd clones are created, the original non-clone test1 shall + call f03 (score 6), the sse2/avx/avx2 clones too, but avx512f clones + shall call f01 with score 8. */ + /* { dg-final { scan-ltrans-tree-dump-not "f04 \\\(x" "optimized" } } */ + /* { dg-final { scan-ltrans-tree-dump-times "f03 \\\(x" 14 "optimized" } } */ + /* { dg-final { scan-ltrans-tree-dump-times "f01 \\\(x" 4 "optimized" } } */ + int a = f04 (x); + int b = f04 (x); + return a + b; +} |