diff --git a/community/blog/2024-01-22-exploring-cpu-microkernels-on-a-matmul-example/index.html b/community/blog/2024-01-22-exploring-cpu-microkernels-on-a-matmul-example/index.html index 49557e3947fd..c885e32f37fd 100755 --- a/community/blog/2024-01-22-exploring-cpu-microkernels-on-a-matmul-example/index.html +++ b/community/blog/2024-01-22-exploring-cpu-microkernels-on-a-matmul-example/index.html @@ -3551,8 +3551,7 @@ - -
// -----// IR Dump After LowerUKernelOpsToCalls (iree-codegen-lower-ukernel-ops-to-calls) //----- //
module {
func.func private @iree_uk_mmt4d(memref<f32>, index, index, memref<f32>, index, index, memref<f32>, index, index, index, index, index, i32, i32, i32, i32) attributes {hal.import.bitcode = true, hal.import.cconv = 1 : i32, hal.import.fields = ["processor_data"], llvm.bareptr = true}
@@ -5152,7 +5140,7 @@ Ukernel bitcode: tile function ret void
}
...optimized.bc
, disassembled to ...optimized.ll
link...optimized.bc
, disassembled to ...optimized.ll
link; Function Attrs: nofree norecurse nosync nounwind
define internal noundef i32 @matmul_dynamic_dispatch_3_mmt4d_DxDxDx16x16x1_f32(ptr noalias nocapture nonnull readonly align 16 %0, ptr noalias nocapture nonnull readonly align 16 %1, ptr noalias nocapture nonnull readonly align 16 %2) #1 !dbg !90 {
%.elt7 = getelementptr inbounds %iree_hal_executable_dispatch_state_v0_t.19, ptr %1, i64 0, i32 4, !dbg !91