@@ -40,7 +40,6 @@ std::vector<Isolate> getIsolates(const std::string& isolates_unparsed);
40
40
std::vector<std::string> getNoFolds (::intel_npu::Config& cfg);
41
41
std::vector<std::string> getNoFolds (const std::string& nofolds_unparsed);
42
42
// Set default predefined values for COMPUTE pipeline
43
- void setComputeConfig (PassContext& ctx);
44
43
void dump_partitioning (const ov::npuw::Ensemble& ens, const std::string& to);
45
44
46
45
size_t getMinGraphSize (::intel_npu::Config& cfg) {
@@ -204,12 +203,6 @@ std::vector<std::string> getNoFolds(const std::string& nofolds_unparsed) {
204
203
return nofolds;
205
204
}
206
205
207
- void setComputeConfig (PassContext& ctx) {
208
- // FIXME: initialize via a dedicated function instead of parsing
209
- ctx.isolates = detail::getIsolates (ISOL_PRESETS.at (" COMPUTE" ));
210
- ctx.nofolds = detail::getNoFolds (" compute" );
211
- }
212
-
213
206
void dump_partitioning (const ov::npuw::Ensemble& ens, const std::string& to) {
214
207
pugi::xml_document doc;
215
208
@@ -277,10 +270,21 @@ class Compiler {
277
270
NONE, // Partitioning will consist of a single group with all the Ops
278
271
INIT, // Initialize only. The hardest mode, every group has just 1 layer inside
279
272
JUST, // "justParitioning" - combination of LHF + Remnants
280
- REP, // Repeated blocks pipeline - combination of repeatedBlocks and Remnants - default configuration
273
+ REP, // Repeated blocks pipeline - combination of repeatedBlocks and Remnants
274
+ REG, // Regularized repeated blocks pipeline -same as REP, but with some strong hints first
281
275
COMPUTE // Separates non-foldable compute subgraphs from the model based on predefined rules + REP
282
276
};
283
277
278
+ template <class C >
279
+ void warn_unused () {
280
+ const auto & val = m_cfg.get <C>();
281
+ if (val != C::defaultValue ()) {
282
+ LOG_WARN (" User-specified configuration {" << C::key () << " : " << val
283
+ << " } is ignored in the current pipeline "
284
+ << m_cfg.get <::intel_npu::NPUW_ONLINE_PIPELINE>());
285
+ }
286
+ }
287
+
284
288
Pipeline currentPipeline () {
285
289
std::string pipeline_opt = m_cfg.getString <::intel_npu::NPUW_ONLINE_PIPELINE>();
286
290
if (pipeline_opt == " NONE" ) {
@@ -291,6 +295,8 @@ class Compiler {
291
295
return Pipeline::JUST;
292
296
} else if (pipeline_opt == " REP" ) {
293
297
return Pipeline::REP;
298
+ } else if (pipeline_opt == " REG" ) {
299
+ return Pipeline::REG;
294
300
} else if (pipeline_opt == " COMPUTE" ) {
295
301
return Pipeline::COMPUTE;
296
302
} else {
@@ -346,6 +352,23 @@ class Compiler {
346
352
LOG_INFO (" Done" );
347
353
}
348
354
355
+ void reg () {
356
+ LOG_INFO (" Online partitioning: compiling regularized repeated blocks pipeline..." );
357
+ LOG_BLOCK ();
358
+
359
+ m_snapshot->earlyAvoids ();
360
+ m_snapshot->earlyRegroup ();
361
+ m_snapshot->repeatedBlocks ([&]() {
362
+ // This callback is called when repeatingBlocks algorithm thinks it is done
363
+ m_snapshot->stripTag (" compute" );
364
+ });
365
+ m_snapshot->repeat ([&] {
366
+ m_snapshot->fuseRemnantsExtended ();
367
+ });
368
+
369
+ LOG_INFO (" Done" );
370
+ }
371
+
349
372
public:
350
373
Compiler (const std::shared_ptr<ov::Model>& model, ::intel_npu::Config& cfg)
351
374
: m_model(model),
@@ -384,9 +407,24 @@ class Compiler {
384
407
case Pipeline::REP:
385
408
rep ();
386
409
break ;
410
+ case Pipeline::REG:
411
+ warn_unused<::intel_npu::NPUW_ONLINE_ISOLATE>();
412
+
413
+ // Only get isolates here.
414
+ // NB: We ignore NO_FOLD everywhere except pipeline COMPUTE - this needs
415
+ // to be aligned in the future
416
+ ctx.isolates = detail::getIsolates (detail::ISOL_PRESETS.at (" COMPUTE" ));
417
+ m_snapshot->setCtx (ctx);
418
+ reg ();
419
+ break ;
387
420
case Pipeline::COMPUTE:
421
+ warn_unused<::intel_npu::NPUW_ONLINE_ISOLATE>();
422
+ warn_unused<::intel_npu::NPUW_ONLINE_NO_FOLD>();
423
+
388
424
// Manually set predefined isolates and nofolds then do rep() pipeline
389
- detail::setComputeConfig (ctx);
425
+ // FIXME: initialize via a dedicated function instead of parsing
426
+ ctx.isolates = detail::getIsolates (detail::ISOL_PRESETS.at (" COMPUTE" ));
427
+ ctx.nofolds = detail::getNoFolds (" compute" );
390
428
m_snapshot->setCtx (ctx);
391
429
rep ();
392
430
break ;
0 commit comments