Skip to content

Commit

Permalink
This is a temporary solution in order to transition to system-provided LLVM releases.
Browse files Browse the repository at this point in the history
Since we will no longer patch LLVM sources, we need to customize some LLVM passes to get the desired behavior.

InstCombiner, by default, performs instruction sinking while combining. This has multiple negative effects (breaking I/O coalescing, increasing register pressure). The solution so far was to apply a patch to the LLVM code base to disable this.

Since we do not use patches on LLVM anymore, we copy the pass into the IGC codebase and customize it there.

A discussion is under way to include some of those customizations in LLVM trunk; however, that would happen only after the LLVM 7.0 transition.
At that point, this check-in should be removed to keep the design clean.

Change-Id: I14cc6870ec046a85ccd721f92435ded1d98df1f8
  • Loading branch information
ktrifunovic authored and gfxbot committed Nov 2, 2018
1 parent 432c310 commit 25753bb
Show file tree
Hide file tree
Showing 21 changed files with 28,956 additions and 73 deletions.
7 changes: 5 additions & 2 deletions IGC/AdaptorOCL/UnifyIROCL.cpp
Expand Up @@ -104,6 +104,8 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#include "Compiler/MetaDataUtilsWrapper.h"
#include "Compiler/SPIRMetaDataTranslation.h"
#include "Compiler/Optimizer/OpenCLPasses/ErrorCheckPass.h"


#include "Compiler/MetaDataApi/IGCMetaDataDefs.h"
#include "Compiler/MetaDataApi/IGCMetaDataHelper.h"
#include "Compiler/CodeGenContextWrapper.hpp"
Expand All @@ -112,6 +114,7 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#include "Compiler/MetaDataApi/SpirMetaDataApi.h"
#include "Compiler/Optimizer/FixFastMathFlags.hpp"
#include "MoveStaticAllocas.h"
#include "Compiler/Optimizer/IGCInstCombiner/4.0/IGCInstructionCombining.hpp"

#include "common/debug/Debug.hpp"
#include "common/igc_regkeys.hpp"
Expand Down Expand Up @@ -397,7 +400,7 @@ static void CommonOCLBasedPasses(
mpm.add(createSimplifyConstantPass());
mpm.add(createPromoteConstantPass());
}
mpm.add(createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());

// Instcombine can create constant expressions, which are not handled by the program scope constant resolution pass
mpm.add(new BreakConstantExpr());
Expand All @@ -415,7 +418,7 @@ static void CommonOCLBasedPasses(

// TODO: Run CheckInstrTypes after builtin import to determine if builtins have allocas.
mpm.add(createSROAPass());
mpm.add(createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());

// "false" to createScalarizerPass() means that vector load/stores are NOT scalarized
mpm.add(createScalarizerPass(false));
Expand Down
12 changes: 7 additions & 5 deletions IGC/Compiler/CISACodeGen/ShaderCodeGen.cpp
Expand Up @@ -157,6 +157,7 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#include "Compiler/Optimizer/SetMathPrecisionForPositionOutput.hpp"
#include "Compiler/DebugInfo/VISADebugEmitter.hpp"
#include "Compiler/SampleCmpToDiscard.h"
#include "Compiler/Optimizer/IGCInstCombiner/4.0/IGCInstructionCombining.hpp"

#include "DebugInfo.hpp"

Expand Down Expand Up @@ -489,7 +490,7 @@ inline void AddLegalizationPasses(CodeGenContext &ctx, const CShaderProgram::Ker
if (IGC_IS_FLAG_ENABLED(EnableAdvMemOpt))
mpm.add(createAdvMemOptPass());
mpm.add(createMemOptPass());
mpm.add(llvm::createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());
}

if (!isOptDisabled &&
Expand Down Expand Up @@ -535,7 +536,7 @@ inline void AddLegalizationPasses(CodeGenContext &ctx, const CShaderProgram::Ker
// Optimize lower-level IR
if (!fastCompile)
{
mpm.add(createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());
}
mpm.add(new GenSpecificPattern());
if (!fastCompile)
Expand Down Expand Up @@ -1179,7 +1180,7 @@ void OptimizeIR(CodeGenContext* pContext)
mpm.add(createGenFDIVEmulation());
}

mpm.add(llvm::createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());
mpm.add(llvm::createDeadCodeEliminationPass()); // this should be done both before/after constant propagation

if (pContext->m_instrTypes.hasGenericAddressSpacePointers &&
Expand Down Expand Up @@ -1219,7 +1220,7 @@ void OptimizeIR(CodeGenContext* pContext)
mpm.add(new CustomLoopVersioning());
}

mpm.add(llvm::createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());
if (IGC_IS_FLAG_ENABLED(EnableAdvCodeMotion) &&
pContext->type == ShaderType::OPENCL_SHADER &&
!pContext->m_instrTypes.hasSwitch)
Expand Down Expand Up @@ -1324,7 +1325,8 @@ void OptimizeIR(CodeGenContext* pContext)
mpm.add(llvm::createJumpThreadingPass());

// run instruction combining to clean up the code after CFG optimizations
mpm.add(createInstructionCombiningPass());
mpm.add(createIGCInstructionCombiningPass());

mpm.add(llvm::createDeadCodeEliminationPass());
mpm.add(llvm::createEarlyCSEPass());

Expand Down
4 changes: 3 additions & 1 deletion IGC/Compiler/InitializePasses.h
Expand Up @@ -114,7 +114,7 @@ void initializeWIAnalysisPass(llvm::PassRegistry&);
void initializeWIFuncResolutionPass(llvm::PassRegistry&);
void initializeWIFuncsAnalysisPass(llvm::PassRegistry&);
void initializeWorkaroundAnalysisPass(llvm::PassRegistry&);
void initializeWAFMinFMaxPass(llvm::PassRegistry&);
void initializeWAFMinFMaxPass(llvm::PassRegistry&);
void initializePingPongTexturesAnalysisPass(llvm::PassRegistry&);
void initializePingPongTexturesOptPass(llvm::PassRegistry&);
void initializeLinkTessControlShaderPass(llvm::PassRegistry&);
Expand All @@ -135,3 +135,5 @@ void initializeCheckInstrTypesPass(llvm::PassRegistry&);
void initializeHalfPromotionPass(llvm::PassRegistry&);
void initializeFixFastMathFlagsPass(llvm::PassRegistry&);
void initializeCodeAssumptionPass(llvm::PassRegistry&);
// Registration hook for IGC::IGCInstructionCombiningPass; that class's
// constructor calls it with the global llvm::PassRegistry.
// NOTE(review): the doubled "Pass" suffix presumably comes from LLVM's
// INITIALIZE_PASS macros appending "Pass" to the class name - confirm
// against the pass's .cpp file.
void initializeIGCInstructionCombiningPassPass(llvm::PassRegistry&);

134 changes: 69 additions & 65 deletions IGC/Compiler/Optimizer/CMakeLists.txt
@@ -1,65 +1,69 @@
include_directories("${CMAKE_CURRENT_SOURCE_DIR}")

add_subdirectory(OpenCLPasses)
add_subdirectory(OpenGLPasses)

set(IGC_BUILD__SRC__Optimizer
"${CMAKE_CURRENT_SOURCE_DIR}/BuiltInFuncImport.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InfiniteLoopRemoval.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/LinkMultiRateShaders.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/MCSOptimization.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/GatingSimilarSamples.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIConverter.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIUtils.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncImport.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncLibrary.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/Scalarizer.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/SetMathPrecisionForPositionOutput.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/FixFastMathFlags.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/CodeAssumption.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/MarkReadOnlyLoad.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/RectListOptimizationPass.cpp"
)

set(IGC_BUILD__SRC__Compiler_Optimizer
${IGC_BUILD__SRC__Optimizer}
${IGC_BUILD__SRC__Optimizer_OpenCLPasses}
${IGC_BUILD__SRC__Optimizer_OpenGLPasses}
PARENT_SCOPE
)

set(IGC_BUILD__HDR__Optimizer
"${CMAKE_CURRENT_SOURCE_DIR}/BuiltInFuncImport.h"
"${CMAKE_CURRENT_SOURCE_DIR}/InfiniteLoopRemoval.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/LinkMultiRateShaders.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIConverter.h"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIUtils.h"
"${CMAKE_CURRENT_SOURCE_DIR}/MCSOptimization.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/GatingSimilarSamples.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncImport.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/Scalarizer.h"
"${CMAKE_CURRENT_SOURCE_DIR}/SetMathPrecisionForPositionOutput.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/FixFastMathFlags.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/CodeAssumption.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/RectListOptimizationPass.hpp"
)


set(IGC_BUILD__HDR__Compiler_Optimizer
${IGC_BUILD__HDR__Optimizer}
${IGC_BUILD__HDR__Optimizer_OpenCLPasses}
${IGC_BUILD__HDR__Optimizer_OpenGLPasses}
PARENT_SCOPE
)


igc_sg_register(
Compiler__Optimizer
"Optimizer"
GROUPS
Compiler__Optimizer_OpenCLPasses
Compiler__Optimizer_OpenGLPasses
FILES
${IGC_BUILD__SRC__Optimizer}
${IGC_BUILD__HDR__Optimizer}
)
# Build description for the Compiler/Optimizer directory: collects this
# directory's sources and headers, merges in the lists produced by the
# sub-directories, and exports the combined lists to the parent scope.

# Make headers in this directory reachable via #include.
include_directories("${CMAKE_CURRENT_SOURCE_DIR}")

# Process the sub-directories first.
# NOTE(review): they are presumably what sets the
# IGC_BUILD__{SRC,HDR}__Optimizer_<SubDir> variables consumed below - confirm
# against each sub-directory's CMakeLists.txt.
add_subdirectory(OpenCLPasses)
add_subdirectory(OpenGLPasses)
add_subdirectory(IGCInstCombiner)

# Source files that live directly in this directory.
set(IGC_BUILD__SRC__Optimizer
"${CMAKE_CURRENT_SOURCE_DIR}/BuiltInFuncImport.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InfiniteLoopRemoval.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/LinkMultiRateShaders.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/MCSOptimization.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/GatingSimilarSamples.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIConverter.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIUtils.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncImport.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncLibrary.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/Scalarizer.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/SetMathPrecisionForPositionOutput.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/FixFastMathFlags.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/CodeAssumption.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/MarkReadOnlyLoad.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/RectListOptimizationPass.cpp"
)

# Combined source list (this directory plus all sub-directories), exported to
# the parent directory's scope via PARENT_SCOPE.
set(IGC_BUILD__SRC__Compiler_Optimizer
${IGC_BUILD__SRC__Optimizer}
${IGC_BUILD__SRC__Optimizer_OpenCLPasses}
${IGC_BUILD__SRC__Optimizer_OpenGLPasses}
${IGC_BUILD__SRC__Optimizer_IGCInstCombiner}
PARENT_SCOPE
)

# Header files that live directly in this directory.
set(IGC_BUILD__HDR__Optimizer
"${CMAKE_CURRENT_SOURCE_DIR}/BuiltInFuncImport.h"
"${CMAKE_CURRENT_SOURCE_DIR}/InfiniteLoopRemoval.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/LinkMultiRateShaders.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIConverter.h"
"${CMAKE_CURRENT_SOURCE_DIR}/OCLBIUtils.h"
"${CMAKE_CURRENT_SOURCE_DIR}/MCSOptimization.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/GatingSimilarSamples.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/PreCompiledFuncImport.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/Scalarizer.h"
"${CMAKE_CURRENT_SOURCE_DIR}/SetMathPrecisionForPositionOutput.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/FixFastMathFlags.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/CodeAssumption.hpp"
"${CMAKE_CURRENT_SOURCE_DIR}/RectListOptimizationPass.hpp"
)


# Combined header list (this directory plus all sub-directories), exported to
# the parent directory's scope via PARENT_SCOPE.
set(IGC_BUILD__HDR__Compiler_Optimizer
${IGC_BUILD__HDR__Optimizer}
${IGC_BUILD__HDR__Optimizer_OpenCLPasses}
${IGC_BUILD__HDR__Optimizer_OpenGLPasses}
${IGC_BUILD__HDR__Optimizer_IGCInstCombiner}
PARENT_SCOPE
)


# igc_sg_register is a project helper defined elsewhere.
# NOTE(review): presumably it registers a source group labelled "Optimizer"
# containing the FILES below, with the listed GROUPS nested under it - confirm
# against the helper's definition.
igc_sg_register(
Compiler__Optimizer
"Optimizer"
GROUPS
Compiler__Optimizer_OpenCLPasses
Compiler__Optimizer_OpenGLPasses
Compiler__Optimizer_IGCInstCombiner
FILES
${IGC_BUILD__SRC__Optimizer}
${IGC_BUILD__HDR__Optimizer}
)
34 changes: 34 additions & 0 deletions IGC/Compiler/Optimizer/IGCInstCombiner/4.0/CMakeLists.txt
@@ -0,0 +1,34 @@
# Build description for the InstCombine sources kept in this "4.0" directory.
# NOTE(review): "4.0" presumably names the LLVM release the sources were
# copied from - confirm.

# Make headers in this directory reachable via #include.
include_directories("${CMAKE_CURRENT_SOURCE_DIR}")


# Source files that live in this directory.
set(IGC_BUILD__SRC__4_0
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineAddSub.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineAndOrXor.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineCalls.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineCasts.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineCompares.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineLoadStoreAlloca.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineMulDivRem.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombinePHI.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineSelect.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineShifts.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineSimplifyDemanded.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineVectorOps.cpp"
"${CMAKE_CURRENT_SOURCE_DIR}/InstructionCombining.cpp"
)
# Re-export the source list to the parent directory's scope under a
# directory-qualified name.
set(IGC_BUILD__SRC__IGCInstCombiner_4_0 ${IGC_BUILD__SRC__4_0} PARENT_SCOPE)

# Header files that live in this directory.
set(IGC_BUILD__HDR__4_0
"${CMAKE_CURRENT_SOURCE_DIR}/InstCombineInternal.h"
"${CMAKE_CURRENT_SOURCE_DIR}/IGCInstructionCombining.hpp"
)
# Re-export the header list to the parent directory's scope under a
# directory-qualified name.
set(IGC_BUILD__HDR__IGCInstCombiner_4_0 ${IGC_BUILD__HDR__4_0} PARENT_SCOPE)


# igc_sg_register is a project helper defined elsewhere.
# NOTE(review): presumably it registers a source group labelled "4.0"
# containing the files listed above - confirm against the helper's definition.
igc_sg_register(
Optimizer__IGCInstCombiner_4_0
"4.0"
FILES
${IGC_BUILD__SRC__4_0}
${IGC_BUILD__HDR__4_0}
)
@@ -0,0 +1,62 @@
/*===================== begin_copyright_notice ==================================
Copyright (c) 2017 Intel Corporation
Permission is hereby granted, free of charge, to any person obtaining a
copy of this software and associated documentation files (the
"Software"), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:
The above copyright notice and this permission notice shall be included
in all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
======================= end_copyright_notice ==================================*/
#ifndef IGC_INSTCOMBINE_INSTCOMBINE_H
#define IGC_INSTCOMBINE_INSTCOMBINE_H

#include <llvm/PassRegistry.h>
#include "llvm/Transforms/InstCombine/InstCombineWorklist.h"
#include "llvm/IR/PassManager.h"

#include "Compiler/InitializePasses.h"

namespace llvm {
// Forward declaration of the pass base type.
// NOTE(review): IGCInstructionCombiningPass below derives from
// llvm::FunctionPass, which needs the complete type; presumably one of the
// headers included above pulls in its definition - confirm, or include the
// defining header directly.
class FunctionPass;
}

namespace IGC
{
class IGCInstructionCombiningPass : public llvm::FunctionPass {
llvm::InstCombineWorklist Worklist;
const bool ExpensiveCombines;

public:
static char ID; // Pass identification, replacement for typeid

IGCInstructionCombiningPass(bool ExpensiveCombines = true)
: FunctionPass(ID), ExpensiveCombines(ExpensiveCombines) {
initializeIGCInstructionCombiningPassPass(*llvm::PassRegistry::getPassRegistry());
}

void getAnalysisUsage(llvm::AnalysisUsage &AU) const override;
bool runOnFunction(llvm::Function &F) override;
};


/// Factory for the IGC instruction-combining pass, returned through the
/// llvm::FunctionPass base pointer.
/// NOTE(review): presumably returns a newly allocated
/// IGCInstructionCombiningPass whose ownership passes to the pass manager it
/// is added to - confirm against the definition.
llvm::FunctionPass* createIGCInstructionCombiningPass();
} // namespace IGC

#endif //IGC_INSTCOMBINE_INSTCOMBINE_H

0 comments on commit 25753bb

Please sign in to comment.