| // RUN: %clang_cc1 %s -ffreestanding -triple=x86_64-unknown-unknown -target-feature +avx512f -target-feature +amx-int8 \ |
| // RUN: -target-feature +amx-bf16 -emit-llvm -o - -Werror -pedantic | FileCheck %s --check-prefixes=CHECK |
| |
| #include <immintrin.h> |
| |
| char buf[1024]; |
| #define STRIDE 32 |
| |
| char buf2[1024]; |
| |
| // This is an example code and integration test. |
| void test_api(int cond, short row, short col) { |
| //CHECK-LABEL: @test_api |
| //CHECK: call x86_amx @llvm.x86.tileloadd64.internal |
| //CHECK: call x86_amx @llvm.x86.tdpbssd.internal |
| //CHECK: call void @llvm.x86.tilestored64.internal |
| __tile1024i a = {row, 8}; |
| __tile1024i b = {8, col}; |
| __tile1024i c = {row, col}; |
| |
| if (cond) { |
| __tile_loadd(&a, buf, STRIDE); |
| __tile_loadd(&b, buf, STRIDE); |
| __tile_loadd(&c, buf, STRIDE); |
| } else { |
| __tile_loadd(&a, buf2, STRIDE); |
| __tile_loadd(&b, buf2, STRIDE); |
| __tile_loadd(&c, buf2, STRIDE); |
| } |
| __tile_dpbssd(&c, a, b); |
| __tile_stored(buf, STRIDE, c); |
| } |
| |
| void test_tile_loadd(short row, short col) { |
| //CHECK-LABEL: @test_tile_loadd |
| //CHECK: call x86_amx @llvm.x86.tileloadd64.internal |
| //CHECK-NEXT: {{%.*}} = bitcast x86_amx {{%.*}} to <256 x i32> |
| __tile1024i a = {row, col}; |
| __tile_loadd(&a, buf, STRIDE); |
| } |
| |
| void test_tile_dpbssd(__tile1024i a, __tile1024i b, __tile1024i c) { |
| //CHECK-LABEL: @test_tile_dpbssd |
| //CHECK: call x86_amx @llvm.x86.tdpbssd.internal |
| //CHECK-NEXT: {{%.*}} = bitcast x86_amx {{%.*}} to <256 x i32> |
| __tile_dpbssd(&c, a, b); |
| } |
| |
| void test_tile_stored(__tile1024i c) { |
| //CHECK-LABEL: @test_tile_stored |
| //CHECK: {{%.*}} = bitcast <256 x i32> {{%.*}} to x86_amx |
| //CHECK-NEXT: call void @llvm.x86.tilestored64.internal |
| __tile_stored(buf, STRIDE, c); |
| } |
| |
| void test_tile_zero(__tile1024i c) { |
| //CHECK-LABEL: @test_tile_zero |
| //CHECK: call x86_amx @llvm.x86.tilezero.internal |
| //CHECK-NEXT bitcast x86_amx {{%.*}} to <256 x i32> |
| __tile_zero(&c); |
| } |