Skip to content

Commit

Permalink
Use plain llvmcall calling convention for WMMA intrinsics. (#1709)
Browse files Browse the repository at this point in the history
  • Loading branch information
maleadt committed Jan 5, 2023
1 parent 84aea71 commit 90df1a6
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions src/device/intrinsics/wmma.jl
Original file line number Diff line number Diff line change
Expand Up @@ -191,7 +191,7 @@ for ops in all_ldst_ops,
# Determine types + size for this (matrix, elem_type) combination
arr_ty, frag_ty, sz = get_frag_info(mat, elem_type, shape)

- ccall_name = "extern $llvm_intr"
+ ccall_name = "$llvm_intr"

ptr_ty = LLVMPtr{arr_ty, addr_space_int}
struct_ty = Symbol("LLVMStruct$sz")
Expand Down Expand Up @@ -253,7 +253,7 @@ export llvm_wmma_store
# Determine types + size for this (matrix, elem_type) combination
arr_ty, frag_ty, sz = get_frag_info(mat, elem_type, shape)

- ccall_name = "extern $llvm_intr"
+ ccall_name = "$llvm_intr"
frag_types = ntuple(i -> frag_ty, sz)
frag_vars = ntuple(i -> :(data[$i]), sz)

Expand Down Expand Up @@ -325,7 +325,7 @@ for ops in all_wmma_ops,
c_arr_ty, c_frag_ty, c_sz = get_frag_info("c", c_elem_type, shape)
d_arr_ty, d_frag_ty, d_sz = get_frag_info("d", d_elem_type, shape)

- ccall_name = "extern $llvm_intr"
+ ccall_name = "$llvm_intr"

a_types = ntuple(i -> a_frag_ty, a_sz)
b_types = ntuple(i -> b_frag_ty, b_sz)
Expand Down

0 comments on commit 90df1a6

Please sign in to comment.