| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
| ; RUN: llc -mtriple=amdgcn -mcpu=gfx90a < %s | FileCheck %s |
| |
| ;--------------------------------------------------------------------- |
| ; i32 cases |
| ;--------------------------------------------------------------------- |
| |
| define void @global_atomic_cmpxchg_i32_ret_av_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_av_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_av_av__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_av_av__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_av_av__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_av_av__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_a_a__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_a_a__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_a_a__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_a_a__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_v_a__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_v_a__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_a_v__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_a_v__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_v_v__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_v_v__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_av_v__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_av_v__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_v_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_v_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_av_a__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_av_a__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i32_ret_a_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i32_ret_a_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| ;--------------------------------------------------------------------- |
| ; i64 cases |
| ;--------------------------------------------------------------------- |
| |
| define void @global_atomic_cmpxchg_i64_ret_av_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_av_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_av_av__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_av_av__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_av_av__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_av_av__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_a_a__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_a_a__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_a_a__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_a_a__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_v_a__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_v_a__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_a_v__v(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_a_v__v: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "v"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_v_v__a(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_v_v__a: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: v_accvgpr_write_b32 a0, v0 |
| ; CHECK-NEXT: v_accvgpr_write_b32 a1, v1 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "a"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_av_v__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_av_v__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=v"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_v_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_v_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=v"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_av_a__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_av_a__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v3, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v2, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[4:5] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=^VA"() |
| %data1 = call i64 asm "; def $0", "=a"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| define void @global_atomic_cmpxchg_i64_ret_a_av__av(ptr addrspace(1) %ptr) #0 { |
| ; CHECK-LABEL: global_atomic_cmpxchg_i64_ret_a_av__av: |
| ; CHECK: ; %bb.0: |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def a[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: v_accvgpr_read_b32 v5, a1 |
| ; CHECK-NEXT: v_accvgpr_read_b32 v4, a0 |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; def v[2:3] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: buffer_wbl2 |
| ; CHECK-NEXT: global_atomic_cmpswap_x2 v[0:1], v[0:1], v[2:5], off offset:80 glc |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) |
| ; CHECK-NEXT: buffer_invl2 |
| ; CHECK-NEXT: buffer_wbinvl1_vol |
| ; CHECK-NEXT: ;;#ASMSTART |
| ; CHECK-NEXT: ; use v[0:1] |
| ; CHECK-NEXT: ;;#ASMEND |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| %gep.0 = getelementptr inbounds [512 x i64], ptr addrspace(1) %ptr, i64 0, i64 10 |
| %data0 = call i64 asm "; def $0", "=a"() |
| %data1 = call i64 asm "; def $0", "=^VA"() |
| %pair = cmpxchg ptr addrspace(1) %gep.0, i64 %data0, i64 %data1 seq_cst monotonic |
| %result = extractvalue { i64, i1 } %pair, 0 |
| call void asm "; use $0", "^VA"(i64 %result) |
| ret void |
| } |
| |
| attributes #0 = { nounwind "amdgpu-waves-per-eu"="10,10" } |