| 
1 | 1 | // REQUIRES: amdgpu-registered-target  | 
2 |  | -// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx940 -S -emit-llvm -o - %s | FileCheck %s --check-prefix=CHECK-GFX940  | 
 | 2 | +// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx940  -S -emit-llvm -o - %s | FileCheck %s  | 
 | 3 | +// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx1200 -S -emit-llvm -o - %s | FileCheck %s  | 
3 | 4 | 
 
  | 
// Two-element float vector type; used below as the pointee type of `out` in
// the test_cvt_pk_f32_* functions.
4 | 5 | typedef float  v2f   __attribute__((ext_vector_type(2)));  | 
5 | 6 | 
 
  | 
6 |  | -// CHECK-GFX940-LABEL: @test_cvt_f32_bf8  | 
7 |  | -// CHECK-GFX940: call float @llvm.amdgcn.cvt.f32.bf8(i32 %a, i32 0)  | 
 | 7 | +// CHECK-LABEL: @test_cvt_f32_bf8  | 
 | 8 | +// CHECK: call float @llvm.amdgcn.cvt.f32.bf8(i32 %a, i32 0)  | 
// Calls __builtin_amdgcn_cvt_f32_bf8 with the runtime value `a` and the
// constant second argument 0, storing the result through `out`. The CHECK
// line for this function expects the call to appear in the IR as
// @llvm.amdgcn.cvt.f32.bf8(i32 %a, i32 0).
// NOTE(review): the expected IR call returns float while `out` is declared
// `global int*`, so the store presumably involves an implicit float-to-int
// conversion -- confirm this is intended.
8 | 9 | void test_cvt_f32_bf8(global int* out, int a)  | 
9 | 10 | {  | 
10 | 11 |   *out = __builtin_amdgcn_cvt_f32_bf8(a, 0);  | 
11 | 12 | }  | 
12 | 13 | 
 
  | 
13 |  | -// CHECK-GFX940-LABEL: @test_cvt_f32_fp8  | 
14 |  | -// CHECK-GFX940: call float @llvm.amdgcn.cvt.f32.fp8(i32 %a, i32 1)  | 
 | 14 | +// CHECK-LABEL: @test_cvt_f32_fp8  | 
 | 15 | +// CHECK: call float @llvm.amdgcn.cvt.f32.fp8(i32 %a, i32 1)  | 
// Calls __builtin_amdgcn_cvt_f32_fp8 with the runtime value `a` and the
// constant second argument 1, storing the result through `out`. The CHECK
// line for this function expects the call to appear in the IR as
// @llvm.amdgcn.cvt.f32.fp8(i32 %a, i32 1).
// NOTE(review): the expected IR call returns float while `out` is declared
// `global int*`, so the store presumably involves an implicit float-to-int
// conversion -- confirm this is intended.
15 | 16 | void test_cvt_f32_fp8(global int* out, int a)  | 
16 | 17 | {  | 
17 | 18 |   *out = __builtin_amdgcn_cvt_f32_fp8(a, 1);  | 
18 | 19 | }  | 
19 | 20 | 
 
  | 
20 |  | -// CHECK-GFX940-LABEL: @test_cvt_pk_f32_bf8  | 
21 |  | -// CHECK-GFX940: call <2 x float> @llvm.amdgcn.cvt.pk.f32.bf8(i32 %a, i1 false)  | 
 | 21 | +// CHECK-LABEL: @test_cvt_pk_f32_bf8  | 
 | 22 | +// CHECK: call <2 x float> @llvm.amdgcn.cvt.pk.f32.bf8(i32 %a, i1 false)  | 
// Calls __builtin_amdgcn_cvt_pk_f32_bf8 with the runtime value `a` and the
// constant flag `false`, storing the v2f result through `out`. The CHECK line
// for this function expects a <2 x float> call to
// @llvm.amdgcn.cvt.pk.f32.bf8(i32 %a, i1 false).
22 | 23 | void test_cvt_pk_f32_bf8(global v2f* out, int a)  | 
23 | 24 | {  | 
24 | 25 |   *out = __builtin_amdgcn_cvt_pk_f32_bf8(a, false);  | 
25 | 26 | }  | 
26 | 27 | 
 
  | 
27 |  | -// CHECK-GFX940-LABEL: @test_cvt_pk_f32_fp8  | 
28 |  | -// CHECK-GFX940: call <2 x float> @llvm.amdgcn.cvt.pk.f32.fp8(i32 %a, i1 true)  | 
 | 28 | +// CHECK-LABEL: @test_cvt_pk_f32_fp8  | 
 | 29 | +// CHECK: call <2 x float> @llvm.amdgcn.cvt.pk.f32.fp8(i32 %a, i1 true)  | 
// Calls __builtin_amdgcn_cvt_pk_f32_fp8 with the runtime value `a` and the
// constant flag `true`, storing the v2f result through `out`. The CHECK line
// for this function expects a <2 x float> call to
// @llvm.amdgcn.cvt.pk.f32.fp8(i32 %a, i1 true).
29 | 30 | void test_cvt_pk_f32_fp8(global v2f* out, int a)  | 
30 | 31 | {  | 
31 | 32 |   *out = __builtin_amdgcn_cvt_pk_f32_fp8(a, true);  | 
32 | 33 | }  | 
33 | 34 | 
 
  | 
34 |  | -// CHECK-GFX940-LABEL: @test_cvt_pk_bf8_f32  | 
35 |  | -// CHECK-GFX940: call i32 @llvm.amdgcn.cvt.pk.bf8.f32(float %a, float %b, i32 %old, i1 false)  | 
 | 35 | +// CHECK-LABEL: @test_cvt_pk_bf8_f32  | 
 | 36 | +// CHECK: call i32 @llvm.amdgcn.cvt.pk.bf8.f32(float %a, float %b, i32 %old, i1 false)  | 
// Calls __builtin_amdgcn_cvt_pk_bf8_f32 with two float inputs, the previous
// int value `old`, and the constant flag `false`, storing the int result
// through `out`. Note that the builtin takes its arguments as (a, b, old, flag),
// which differs from this function's parameter order (out, old, a, b).
// The CHECK line for this function expects an i32 call to
// @llvm.amdgcn.cvt.pk.bf8.f32(float %a, float %b, i32 %old, i1 false).
36 | 37 | void test_cvt_pk_bf8_f32(global int* out, int old, float a, float b)  | 
37 | 38 | {  | 
38 | 39 |   *out = __builtin_amdgcn_cvt_pk_bf8_f32(a, b, old, false);  | 
39 | 40 | }  | 
40 | 41 | 
 
  | 
41 |  | -// CHECK-GFX940-LABEL: @test_cvt_pk_fp8_f32  | 
42 |  | -// CHECK-GFX940: call i32 @llvm.amdgcn.cvt.pk.fp8.f32(float %a, float %b, i32 %old, i1 true)  | 
 | 42 | +// CHECK-LABEL: @test_cvt_pk_fp8_f32  | 
 | 43 | +// CHECK: call i32 @llvm.amdgcn.cvt.pk.fp8.f32(float %a, float %b, i32 %old, i1 true)  | 
// Calls __builtin_amdgcn_cvt_pk_fp8_f32 with two float inputs, the previous
// int value `old`, and the constant flag `true`, storing the int result
// through `out`. Note that the builtin takes its arguments as (a, b, old, flag),
// which differs from this function's parameter order (out, old, a, b).
// The CHECK line for this function expects an i32 call to
// @llvm.amdgcn.cvt.pk.fp8.f32(float %a, float %b, i32 %old, i1 true).
43 | 44 | void test_cvt_pk_fp8_f32(global int* out, int old, float a, float b)  | 
44 | 45 | {  | 
45 | 46 |   *out = __builtin_amdgcn_cvt_pk_fp8_f32(a, b, old, true);  | 
46 | 47 | }  | 
47 | 48 | 
 
  | 
48 |  | -// CHECK-GFX940-LABEL: @test_cvt_sr_bf8_f32  | 
49 |  | -// CHECK-GFX940: call i32 @llvm.amdgcn.cvt.sr.bf8.f32(float %a, i32 %b, i32 %old, i32 2)  | 
 | 49 | +// CHECK-LABEL: @test_cvt_sr_bf8_f32  | 
 | 50 | +// CHECK: call i32 @llvm.amdgcn.cvt.sr.bf8.f32(float %a, i32 %b, i32 %old, i32 2)  | 
// Calls __builtin_amdgcn_cvt_sr_bf8_f32 with the float input `a`, the int
// input `b`, the previous int value `old`, and the constant last argument 2,
// storing the int result through `out`. The builtin takes its arguments as
// (a, b, old, 2), which differs from this function's parameter order.
// The CHECK line for this function expects an i32 call to
// @llvm.amdgcn.cvt.sr.bf8.f32(float %a, i32 %b, i32 %old, i32 2).
50 | 51 | void test_cvt_sr_bf8_f32(global int* out, int old, float a, int b)  | 
51 | 52 | {  | 
52 | 53 |   *out = __builtin_amdgcn_cvt_sr_bf8_f32(a, b, old, 2);  | 
53 | 54 | }  | 
54 | 55 | 
 
  | 
55 |  | -// CHECK-GFX940-LABEL: @test_cvt_sr_fp8_f32  | 
56 |  | -// CHECK-GFX940: call i32 @llvm.amdgcn.cvt.sr.fp8.f32(float %a, i32 %b, i32 %old, i32 3)  | 
 | 56 | +// CHECK-LABEL: @test_cvt_sr_fp8_f32  | 
 | 57 | +// CHECK: call i32 @llvm.amdgcn.cvt.sr.fp8.f32(float %a, i32 %b, i32 %old, i32 3)  | 
57 | 58 | void test_cvt_sr_fp8_f32(global int* out, int old, float a, int b)  | 
58 | 59 | {  | 
59 | 60 |   *out = __builtin_amdgcn_cvt_sr_fp8_f32(a, b, old, 3);  | 
 | 
0 commit comments