We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 01c30f6 commit 3a31c57 Copy full SHA for 3a31c57
fastdeploy/model_executor/layers/quantization/weight_only.py
@@ -237,6 +237,8 @@ def __init__(
237
def create_weights(self, layer, **extra_weight_attrs):
238
# TODO(bukejiyu): remove v1 loader check when v0 loader is removed
239
self.model_format = extra_weight_attrs.get("model_format")
240
+ if "split_axis" in extra_weight_attrs and hasattr(layer, "nranks") and layer.nranks > 0:
241
+ extra_weight_attrs = {**extra_weight_attrs, "is_distributed": True}
242
if self.quant_config.is_checkpoint_bf16 and layer.fd_config.load_config.load_choices == "default_v1":
243
weight_shape = layer.weight_shape[::-1] if self.model_format == "torch" else layer.weight_shape
244
layer.weight = layer.create_parameter(
0 commit comments