We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3fffa55 · commit 506ef2d (Copy full SHA for 506ef2d)
1 file changed
transformer_engine/pytorch/module/grouped_linear.py
@@ -599,11 +599,8 @@ def forward(
599
600
if fp8_calibration:
601
for i in range(num_gemms):
602
- # amax of input
603
- for i in range(num_gemms):
604
- input_quantizers[i].calibrate(inputmats[i])
605
606
- weight_quantizers[i].calibrate(weights[i])
+ input_quantizers[i].calibrate(inputmats[i])
+ weight_quantizers[i].calibrate(weights[i])
607
608
if cpu_offloading:
609
mark_not_offload(*weights_fp8, *weights)
0 commit comments