Skip to content

Commit 0ae3683

Browse files
authored
[GPU] Adjust usm_host memory usage for InferRequest tensors (#26896)
### Details:
- Adjust usm_host memory usage for InferRequest tensors
1 parent 108bb73 commit 0ae3683

File tree

1 file changed

+6
-3
lines changed

1 file changed

+6
-3
lines changed

src/plugins/intel_gpu/src/plugin/sync_infer_request.cpp

+6-3
Original file line number | Diff line number | Diff line change
@@ -34,9 +34,12 @@ namespace {
3434
inline bool can_use_usm_host(const cldnn::engine& engine) {
3535
auto can_use_usm = engine.use_unified_shared_memory();
3636

37-
if (engine.get_device_info().gfx_ver.major == 12 && engine.get_device_info().gfx_ver.minor == 60) {
38-
// WA: Disable USM host memory for infer request`s tensors for PVC as
39-
// it has performance issues in case of host <-> device data transfers inside kernels
37+
const auto& device_info = engine.get_device_info();
38+
if ((device_info.gfx_ver.major == 12 && device_info.gfx_ver.minor == 60) ||
39+
(device_info.gfx_ver.major >= 20 && device_info.dev_type == cldnn::device_type::discrete_gpu)) {
40+
// WA: Disable USM host memory for infer request`s tensors for PVC and subsequent dGPUs, as kernel access
41+
// to system memory is slower than using an explicit memcpy (Host <-> Device) call with the copy engine
42+
// Driver tickets with additional details: 6155, 10054
4043
GPU_DEBUG_TRACE << "Do not use usm_host for performance issue" << std::endl;
4144
can_use_usm = false;
4245
}

0 commit comments

Comments
 (0)