From 31aec6276118c07ed605f5961d7b264e69f68f99 Mon Sep 17 00:00:00 2001 From: Mateusz Klimaszewski Date: Wed, 17 Sep 2025 13:50:54 +0200 Subject: [PATCH 1/2] Make parameters config optional in RawPyTorchMergeConfig. --- mergekit/scripts/merge_raw_pytorch.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/mergekit/scripts/merge_raw_pytorch.py b/mergekit/scripts/merge_raw_pytorch.py index 37a4f92b..8da0f0a2 100644 --- a/mergekit/scripts/merge_raw_pytorch.py +++ b/mergekit/scripts/merge_raw_pytorch.py @@ -28,8 +28,8 @@ class InputModelDefinition(BaseModel, frozen=True): class RawPyTorchMergeConfig(BaseModel, frozen=True): merge_method: str - parameters: Optional[Dict[str, ParameterSetting]] models: List[InputModelDefinition] + parameters: Optional[Dict[str, ParameterSetting]] = None dtype: Optional[str] = None base_model: Optional[str] = None @@ -169,7 +169,7 @@ def construct_param_dicts( ): global_params = {} for param_def in merge_method.parameters(): - if param_def.name in config.parameters: + if config.parameters and param_def.name in config.parameters: value = evaluate_setting(tensor_name, config.parameters[param_def.name]) if value is not None: global_params[param_def.name] = value From 29206a40b8b39fd21c65c07418ff727958457192 Mon Sep 17 00:00:00 2001 From: Mateusz Klimaszewski Date: Wed, 17 Sep 2025 14:44:22 +0200 Subject: [PATCH 2/2] Add check if config.parameters is None.
--- mergekit/scripts/merge_raw_pytorch.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mergekit/scripts/merge_raw_pytorch.py b/mergekit/scripts/merge_raw_pytorch.py index 8da0f0a2..a9bdcb12 100644 --- a/mergekit/scripts/merge_raw_pytorch.py +++ b/mergekit/scripts/merge_raw_pytorch.py @@ -192,7 +192,7 @@ def construct_param_dicts( ): tensor_params[mr][param_def.name] = value elif value := evaluate_setting( - tensor_name, config.parameters.get(param_def.name, []) + tensor_name, config.parameters.get(param_def.name, []) if config.parameters else [] ): tensor_params[mr][param_def.name] = value elif param_def.required: