We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent aa20318 commit 42aaded (Copy full SHA for 42aaded)
src/gpu/intel/jit/ir/send_plan.cpp
@@ -1302,6 +1302,11 @@ class view_info_t {
1302
if (type_size < slot_size * type_packing && slot_size < 4)
1303
slot_size = type_size;
1304
1305
+ // Require sub-byte types to fill a dword to avoid striding. This
1306
+ // restriction can be reduced to byte-alignment when the restriction
1307
+ // above is lifted.
1308
+ if (slot_size < 4 && type_packing > 1) gpu_error_not_expected();
1309
+
1310
// GPUs <= XeLP require qword alignment for qword scattered messages,
1311
// downgrade to byte scattered (x1, x2 or x4) when alignment is
1312
// sub-qword.
0 commit comments