Last active
April 17, 2025 11:28
-
-
Save chudur-budur/cbf24834f22c23e9aec0c2fbcfde1b0d to your computer and use it in GitHub Desktop.
Testing linalg.matmul mlir-gpu backend
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# This is the mlir code that I was trying to compile | |
module { | |
func @matmul_linalg(%A: memref<8x8xf32>, %B: memref<8x8xf32>, %C: memref<8x8xf32>) { | |
linalg.matmul ins(%A, %B : memref<8x8xf32>, memref<8x8xf32>) | |
outs(%C: memref<8x8xf32>) | |
return | |
} | |
func @main() { | |
%A = memref.alloc() : memref<8x8xf32> | |
%B = memref.alloc() : memref<8x8xf32> | |
%C = memref.alloc() : memref<8x8xf32> | |
%cf1 = constant 1.0 : f32 | |
linalg.fill(%A, %cf1) : memref<8x8xf32>, f32 | |
linalg.fill(%B, %cf1) : memref<8x8xf32>, f32 | |
linalg.fill(%C, %cf1) : memref<8x8xf32>, f32 | |
call @matmul_linalg(%A, %B, %C) : (memref<8x8xf32>, memref<8x8xf32>, memref<8x8xf32>) -> () | |
return | |
} | |
} |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/bash | |
# This is the script to compile the above code. | |
mlir-opt matmul-gpu-02.mlir.in \ | |
--linalg-tile-to-parallel-loops="linalg-tile-sizes=4,2" \ | |
--convert-linalg-to-parallel-loops \ | |
--test-gpu-greedy-parallel-loop-mapping \ | |
--convert-parallel-loops-to-gpu \ | |
--gpu-kernel-outlining \ | |
--lower-affine \ | |
--convert-scf-to-std \ | |
--canonicalize \ | |
--pass-pipeline="gpu.module(strip-debuginfo, convert-gpu-to-nvvm, gpu-to-cubin)" \ | |
--gpu-to-llvm 2>&1 >matmul-gpu-02.mlir.out | |
mlir-translate matmul-gpu-02.mlir.out --mlir-to-llvmir | opt -O3 -S | llc -O3 | as - -o matmul-gpu-02.mlir.o | |
# Works up to this point. | |
# Then when I try to compile it to executable, | |
clang++-11 matmul-gpu-02.mlir.o -lcuda \ | |
$HOME/opt/llvm/lib/libmlir_cuda_runtime.so \ | |
$HOME/opt/llvm/lib/libmlir_runner_utils.so \ | |
-o matmul-gpu-02 | |
# It gives these errors: | |
# 'cuStreamSynchronize(stream)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuStreamDestroy(stream)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuModuleUnload(module)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuModuleLoadData(&module, data)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuModuleGetFunction(&function, module, name)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamCreate(&stream, CU_STREAM_NON_BLOCKING)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuLaunchKernel(function, gridX, gridY, gridZ, blockX, blockY, blockZ, smem, stream, params, extra)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamSynchronize(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamDestroy(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuModuleUnload(module)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuModuleLoadData(&module, data)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuModuleGetFunction(&function, module, name)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamCreate(&stream, CU_STREAM_NON_BLOCKING)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuLaunchKernel(function, gridX, gridY, gridZ, blockX, blockY, blockZ, smem, stream, params, extra)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamSynchronize(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamDestroy(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuModuleUnload(module)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuModuleLoadData(&module, data)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuModuleGetFunction(&function, module, name)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamCreate(&stream, CU_STREAM_NON_BLOCKING)' failed with 'CUDA_ERROR_ILLEGAL_ADDRESS' | |
# 'cuLaunchKernel(function, gridX, gridY, gridZ, blockX, blockY, blockZ, smem, stream, params, extra)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamSynchronize(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuStreamDestroy(stream)' failed with 'CUDA_ERROR_INVALID_HANDLE' | |
# 'cuModuleUnload(module)' failed with 'CUDA_ERROR_INVALID_HANDLE' |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment