@@ -253,7 +253,6 @@ int make_input_tensors(std::vector<dnnl::graph::tensor> &input_ts,
253
253
}
254
254
255
255
// generate tensor for graph path
256
-
257
256
const auto iter = partition_mem_map.find (lt_id);
258
257
if (iter != partition_mem_map.end ()) {
259
258
const auto &graph_mem = iter->second ;
@@ -663,10 +662,16 @@ int doit(const prb_t *prb, res_t *res) {
663
662
std::vector<dnnl::graph::tensor> output_ts (outputs.size ());
664
663
665
664
ref_partition_t ref_partition (dg, partitions[i], inputs, outputs);
666
- // Construct memory for both perf & corr modes
667
- SAFE (ref_partition.init_ref (
668
- graph_in_ports, partition_mem_map_v[i], res),
669
- WARN);
665
+
666
+ if (!has_bench_mode_modifier (mode_modifier_t ::no_ref_memory)) {
667
+ // Construct memory for both perf & corr modes
668
+ SAFE (ref_partition.init_ref (
669
+ graph_in_ports, partition_mem_map_v[i], res),
670
+ WARN);
671
+ if (res->state == SKIPPED) return OK;
672
+ }
673
+
674
+ SAFE (ref_partition.init_graph_mem (partition_mem_map_v[i], res), WARN);
670
675
if (res->state == SKIPPED) return OK;
671
676
672
677
if (has_bench_mode_bit (mode_bit_t ::corr)) {
@@ -682,15 +687,18 @@ int doit(const prb_t *prb, res_t *res) {
682
687
}
683
688
}
684
689
685
- // unmap memory from host to device
686
- map_unmap_partition_mem (partition_mem_map_v[i], inputs, UNMAP, res);
687
- map_unmap_partition_mem (partition_mem_map_v[i], outputs, UNMAP, res);
688
- if (res->state == FAIL) {
689
- BENCHDNN_PRINT (0 ,
690
- " FAIL: Fail to unmap memories to host for partition "
691
- " %zu.\n " ,
692
- i);
693
- return FAIL;
690
+ if (!has_bench_mode_modifier (mode_modifier_t ::no_ref_memory)) {
691
+ // unmap memory from host to device
692
+ map_unmap_partition_mem (partition_mem_map_v[i], inputs, UNMAP, res);
693
+ map_unmap_partition_mem (
694
+ partition_mem_map_v[i], outputs, UNMAP, res);
695
+ if (res->state == FAIL) {
696
+ BENCHDNN_PRINT (0 ,
697
+ " FAIL: Fail to unmap memories to host for partition "
698
+ " %zu.\n " ,
699
+ i);
700
+ return FAIL;
701
+ }
694
702
}
695
703
696
704
const op_ref_list_t &op_list = ref_partition.get_partition_ops ();
@@ -730,9 +738,18 @@ int doit(const prb_t *prb, res_t *res) {
730
738
DNN_GRAPH_SAFE (strm.wait (), WARN, res);
731
739
graph_mem_mgr.stop_graph_mem_check ();
732
740
733
- // map memory from device back to host
734
- map_unmap_partition_mem (partition_mem_map_v[i], inputs, MAP, res);
735
- map_unmap_partition_mem (partition_mem_map_v[i], outputs, MAP, res);
741
+ if (!has_bench_mode_modifier (mode_modifier_t ::no_ref_memory)) {
742
+ // map memory from device back to host
743
+ map_unmap_partition_mem (partition_mem_map_v[i], inputs, MAP, res);
744
+ map_unmap_partition_mem (partition_mem_map_v[i], outputs, MAP, res);
745
+ if (res->state == FAIL) {
746
+ BENCHDNN_PRINT (0 ,
747
+ " FAIL: Fail to map memories back to host for partition "
748
+ " %zu.\n " ,
749
+ i);
750
+ return FAIL;
751
+ }
752
+ }
736
753
737
754
// If the device is out-of-memory due to graph path execution, skip the
738
755
// case.
0 commit comments