diff --git a/fbgemm_gpu/experimental/gen_ai/bench/quantize_ops.py b/fbgemm_gpu/experimental/gen_ai/bench/quantize_ops.py index c2817c2b8..d53a2c7ff 100644 --- a/fbgemm_gpu/experimental/gen_ai/bench/quantize_ops.py +++ b/fbgemm_gpu/experimental/gen_ai/bench/quantize_ops.py @@ -165,7 +165,7 @@ def quantize(self, x, w): return xq, wq, x_scale, w_scale def compute(self, xq, wq, x_scale, w_scale): - output, _ = torch._scaled_mm( + output = torch._scaled_mm( xq, wq, bias=None,