Skip to content

Commit

Permalink
Merge 2643edc into d01fb23
Browse files Browse the repository at this point in the history
  • Loading branch information
hanhanW committed Jun 20, 2024
2 parents d01fb23 + 2643edc commit 40f6a3a
Showing 1 changed file with 4 additions and 7 deletions.
11 changes: 4 additions & 7 deletions compiler/src/iree/compiler/Codegen/LLVMCPU/Passes.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -498,12 +498,6 @@ void addMmt4dTilingExpertPassPipeline(OpPassManager &funcPassManager,
LLVMCPUPipelineOptions &pipelineOpt) {
addTileAndDistributePasses(funcPassManager);

if (pipelineOpt.enableUkernels) {
funcPassManager.addPass(createCPUPrepareUkernelsPass());
funcPassManager.addPass(
createCPULowerToUKernelsPass(clSkipIntermediateRoundings));
}

// We still run codegen pipeline because we want a better fallback when
// ukernels are not available. They are no-ops if the mmt4d op is converted to
// ukernels. If ukernels are not implemented, the lowering config is still
Expand Down Expand Up @@ -531,11 +525,14 @@ void addMmt4dTilingExpertPassPipeline(OpPassManager &funcPassManager,
funcPassManager.addPass(createLLVMCPUTilePass(i));
continue;
}

funcPassManager.addPass(createLLVMCPUTilePass(i));
}
}

funcPassManager.addPass(createCPUPrepareUkernelsPass());
funcPassManager.addPass(
createCPULowerToUKernelsPass(clSkipIntermediateRoundings));

{
GenericVectorizationPassOptions options;
options.enableVectorMasking = pipelineOpt.enableVectorMasking;
Expand Down

0 comments on commit 40f6a3a

Please sign in to comment.