Skip to content

Commit f5729fa

Browse files
xe: jit: gemm: fix bf16 scale handling
1 parent 42be8d5 commit f5729fa

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

src/gpu/intel/jit/gemm/generator/pieces/quantization.cxx

+2 -1
Original file line number | Diff line number | Diff line change
@@ -320,13 +320,14 @@ void BLASKernelGenerator<hw>::gemmDequantizeOperation(bool doA, Type T, Type To,
320320
ne = std::min(ne, xqGroupMN - (l0 % xqGroupMN));
321321
} else if (colMajor == doA) {
322322
ne = std::min(ne, neq);
323-
if (qblock->crosspack * To != crosspack * T) stub();
323+
if (qblock->crosspack * To < crosspack * T) stub();
324324
} else {
325325
ne = std::min(ne, xqGroupK);
326326
strideq = 0;
327327
}
328328

329329
int maxSIMD = (op == BinaryOp::Sub && T.isInt8()) ? 64 : 32;
330+
if(To == Type::f32) maxSIMD = 16;
330331
int simd = std::min({ne * crosspack / strided, 2 * elementsPerGRF(hw, T) / strided, maxSIMD});
331332
switch (op) {
332333
case BinaryOp::Sub:

0 commit comments

Comments (0)