Add an mlx_lm.server model example under `models:` and terminate the file with a newline.
NOTE(review): line breaks and leading indentation were reconstructed from a flattened copy of this patch - verify context lines against config.example.yaml before applying.

diff --git a/config.example.yaml b/config.example.yaml
index 381bd0cf..5e1c7687 100644
--- a/config.example.yaml
+++ b/config.example.yaml
@@ -169,6 +169,13 @@ models:
     # - processes have 5 seconds to shutdown until forceful termination is attempted
     cmdStop: docker stop ${MODEL_ID}
 
+  # mlx_lm.server example:
+  "mlx-community/Qwen3-Next-80B-A3B-Thinking-4bit":
+    cmd: |
+      mlx_lm.server --port ${PORT}
+      --model /models/mlx-community/Qwen3-Next-80B-A3B-Thinking-4bit
+    useModelName: "/models/mlx-community/Qwen3-Next-80B-A3B-Thinking-4bit"
+
 # groups: a dictionary of group settings
 # - optional, default: empty dictionary
 # - provides advanced controls over model swapping behaviour
@@ -246,4 +253,4 @@ hooks:
     # - when preloading multiple models at once, define a group
     #   otherwise models will be loaded and swapped out
     preload:
-      - "llama"
\ No newline at end of file
+      - "llama"