Skip to content

Commit 09e32c1

Browse files
authored
Improving glslang -O1 passes (shader-slang#1926)
* #include an absolute path didn't work - because paths were taken to always be relative. * Improve passes used for -O1 option with glslang. * Set sourceManager when serializing container.
1 parent b2ad8e9 commit 09e32c1

File tree

2 files changed

+59
-16
lines changed

2 files changed

+59
-16
lines changed

source/slang-glslang/slang-glslang.cpp

+54-12
Original file line numberDiff line numberDiff line change
@@ -161,6 +161,17 @@ static void glslang_optimizeSPIRV(std::vector<unsigned int>& spirv, spv_target_e
161161

162162
spvtools::OptimizerOptions spvOptOptions;
163163

164+
// To compile some large shaders the default is not enough.
165+
// That although this limit is exceeded, the final optimized output is typically well
166+
// within the range.
167+
//
168+
// See kDefaultMaxIdBound for description of this limit.
169+
//
170+
// If a compilation produces a warning like
171+
// `0:0: ID overflow. Try running compact-ids.`
172+
// it might be fixable by raising the multiplier to a larger value.
173+
spvOptOptions.set_max_id_bound(kDefaultMaxIdBound * 4);
174+
164175
// TODO confirm which passes we want to invoke for each level
165176
switch (optimizationLevel)
166177
{
@@ -182,7 +193,47 @@ static void glslang_optimizeSPIRV(std::vector<unsigned int>& spirv, spv_target_e
182193
optimizer.RegisterPass(spvtools::CreateLocalAccessChainConvertPass());
183194
optimizer.RegisterPass(spvtools::CreateAggressiveDCEPass());
184195
}
185-
#endif
196+
#elif 1
197+
// 6Mb 27 secs (all passes up to 9)
198+
// 9Mb 25 secs (all passes up to 7)
199+
// 8Mb 15 secs (all passes) -(5,6,7)
200+
// 6Mb 15 secs (all passes) -(6,7)
201+
202+
// This list of passes takes the previous 'default optimization'
203+
// passes (as listed above) and tries to combine them in order with the 'new' passes below.
204+
// The issue with the passes below is that although it produces smaller SPIR-V fairly quickly
205+
// it can cause serious problem on some drivers.
206+
//
207+
// Across a wide range of compilations this produced SPIR-V that is less than half size of the
208+
// previous -O1 passes above.
209+
{
210+
optimizer.RegisterPass(spvtools::CreateWrapOpKillPass()); // 1
211+
optimizer.RegisterPass(spvtools::CreateDeadBranchElimPass()); // 2
212+
213+
optimizer.RegisterPass(spvtools::CreateMergeReturnPass());
214+
optimizer.RegisterPass(spvtools::CreateInlineExhaustivePass());
215+
216+
optimizer.RegisterPass(spvtools::CreateEliminateDeadFunctionsPass()); // 3
217+
218+
optimizer.RegisterPass(spvtools::CreateAggressiveDCEPass());
219+
optimizer.RegisterPass(spvtools::CreatePrivateToLocalPass());
220+
221+
optimizer.RegisterPass(spvtools::CreateScalarReplacementPass(100));
222+
223+
optimizer.RegisterPass(spvtools::CreateCCPPass()); // 4 *
224+
optimizer.RegisterPass(spvtools::CreateSimplificationPass()); // 5
225+
//optimizer.RegisterPass(spvtools::CreateIfConversionPass()); // 6
226+
//optimizer.RegisterPass(spvtools::CreateBlockMergePass()); // 7 *
227+
228+
optimizer.RegisterPass(spvtools::CreateLocalAccessChainConvertPass());
229+
230+
optimizer.RegisterPass(spvtools::CreateLocalSingleBlockLoadStoreElimPass()); // 8
231+
232+
optimizer.RegisterPass(spvtools::CreateAggressiveDCEPass());
233+
234+
optimizer.RegisterPass(spvtools::CreateVectorDCEPass()); // 9
235+
}
236+
#else
186237
// The following selection of passes was created by
187238
// 1) Taking the list of passes from optimizer.RegisterSizePasses
188239
// 2) Disable/enable passes to try to produce some reasonable combination of low SPIR-V output size and compilation speed
@@ -242,6 +293,7 @@ static void glslang_optimizeSPIRV(std::vector<unsigned int>& spirv, spv_target_e
242293
optimizer.RegisterPass(spvtools::CreateAggressiveDCEPass());
243294
optimizer.RegisterPass(spvtools::CreateCFGCleanupPass());
244295
}
296+
#endif
245297

246298
break;
247299
case SLANG_OPTIMIZATION_LEVEL_HIGH:
@@ -256,17 +308,7 @@ static void glslang_optimizeSPIRV(std::vector<unsigned int>& spirv, spv_target_e
256308
// Use the same passes when specifying the "-O" flag in spirv-opt
257309
// Roughly equivalent to `RegisterPerformancePasses`
258310

259-
// To compile some large shaders the default is not enough.
260-
// That although this limit is exceeded, the final optimized output is typically well
261-
// within the range.
262-
//
263-
// See kDefaultMaxIdBound for description of this limit.
264-
//
265-
// If a compilation produces a warning like
266-
// `0:0: ID overflow. Try running compact-ids.`
267-
// it might be fixable by raising the multiplier to a larger value.
268-
spvOptOptions.set_max_id_bound(kDefaultMaxIdBound * 4);
269-
311+
270312
optimizer.RegisterPass(spvtools::CreateWrapOpKillPass());
271313
optimizer.RegisterPass(spvtools::CreateDeadBranchElimPass());
272314
optimizer.RegisterPass(spvtools::CreateMergeReturnPass());

source/slang/slang-compiler.cpp

+5-4
Original file line numberDiff line numberDiff line change
@@ -2094,17 +2094,18 @@ namespace Slang
20942094
SerialContainerUtil::WriteOptions options;
20952095

20962096
options.compressionType = linkage->serialCompressionType;
2097-
if (linkage->debugInfoLevel != DebugInfoLevel::None)
2098-
{
2099-
options.optionFlags |= SerialOptionFlag::SourceLocation;
2100-
}
21012097
if (linkage->m_obfuscateCode)
21022098
{
21032099
// If code is obfuscated, we *disable* AST output as it is not obfuscated and will reveal
21042100
// too much about IR.
21052101
// Also currently only IR is needed.
21062102
options.optionFlags &= ~SerialOptionFlag::ASTModule;
21072103
}
2104+
else if (linkage->debugInfoLevel != DebugInfoLevel::None && linkage->getSourceManager())
2105+
{
2106+
options.optionFlags |= SerialOptionFlag::SourceLocation;
2107+
options.sourceManager = linkage->getSourceManager();
2108+
}
21082109

21092110
{
21102111
RiffContainer container;

0 commit comments

Comments
 (0)