Skip to content

Commit

Permalink
Merge branch 'lcambier/lto_symbol_fix' into 'main'
Browse files (browse the repository at this point in the history)
tile_matmul: ensure lto_symbol differs for different arch & num_threads

See merge request omniverse/warp!844
  • Loading branch information
nvlukasz committed Nov 6, 2024
2 parents ee98d28 + 92ed3c1 commit 6b3023e
Showing 1 changed file with 1 addition and 3 deletions.
4 changes: 1 addition & 3 deletions warp/builtins.py
Original file line number Diff line number Diff line change
Expand Up @@ -5681,9 +5681,7 @@ def make_function(M, N, K, adtype, bdtype, cdtype, alayout, blayout, clayout):
raise RuntimeError("time_matmul(A, B, C) requires all inputs to be real or complex")
element_type = a_type

- lto_symbol = (
- f"dot_{M}_{N}_{K}_{a_arrangement}_{b_arrangement}_{c_arrangement}_{a_prec}_{b_prec}_{c_prec}_{element_type}"
- )
+ lto_symbol = f"dot_{M}_{N}_{K}_{arch}_{num_threads}_{a_arrangement}_{b_arrangement}_{c_arrangement}_{a_prec}_{b_prec}_{c_prec}_{element_type}"

# early out if LTO for this combination already exists for this module
if lto_symbol in builder.ltoirs:
Expand Down

0 comments on commit 6b3023e

Please sign in to comment.