Commit 67d5ecf

fix(core): add GLM-4.7-Flash-8bit template with glm47_flash parser

- Update version to 0.1.11 in README and script
- Add GLM-4.7-Flash-8bit option to template model selection menu
- Configure reasoning-parser as glm47_flash for GLM-4.7-Flash-8bit
- Update usage instructions with new template model information
- Reorder template choices for better organization

1 parent b56f167 commit 67d5ecf

File tree

2 files changed (+53, -21 lines)

README.md

Lines changed: 39 additions & 7 deletions
````diff
@@ -9,7 +9,7 @@ MLX Hugging Face Manager
 by Laurent Marques
 ```
 
-**Version: 0.1.10**
+**Version: 0.1.11**
 
 A terminal-based LLM model manager for Apple Silicon Macs. Browse, install, and run MLX-optimized models from Hugging Face with an intuitive TUI interface.
 
@@ -89,15 +89,44 @@ brew install huggingface-cli
 - Python 3.11 or 3.12 (Python 3.13+ is not yet supported)
 - Use pyenv to manage Python versions if needed
 
-#### Installation Method 1: Using pipx (Recommended)
+#### Installation Method 1: Using uv (Recommended)
 
 ```bash
-# Install mlx-openai-server
-pipx install mlx-openai-server
+```bash
 
-# Update mlx-lm to latest version for newest model support (e.g., iquestcoder)
-pipx runpip mlx-openai-server uninstall mlx-lm -y
-pipx runpip mlx-openai-server install git+https://github.com/ml-explore/mlx-lm.git
+
+# Set your preferred Python version
+pyenv global 3.12.8
+
+cd ~/Scripts/mlx-tools
+
+# Clone the mlx-openai-server repository
+git clone https://github.com/cubist38/mlx-openai-server.git
+cd mlx-openai-server
+
+# Create virtual environment (will use your pyenv Python 3.12.8)
+uv venv
+
+# Activate the environment
+source .venv/bin/activate
+
+# Install in development mode
+uv pip install -e .
+
+# Install latest mlx-lm from GitHub if needed to update to last mlx-lm
+# uv pip install git+https://github.com/ml-explore/mlx-lm.git
+
+```
+Then
+> add in your zshrc
+```bash
+mlx-openai-server() {
+  local original_dir="$PWD"
+  cd ~/Scripts/mlx-tools/mlx-openai-server
+  source .venv/bin/activate
+  command mlx-openai-server "$@"
+  cd "$original_dir"
+}
 ```
 
 **Verify installation:**
@@ -349,6 +378,9 @@ $MODEL_DIR/ # Selected path (External/Local/Legacy)
 - Added template models documentation with usage instructions
 - Improved main menu organization and discoverability
 
+**Fix (v0.1.11):**
+- Added **glm47_flash** to --reasoning-parser param from GLM-4.7-Flash-8bit template
+
 ## Keyboard Shortcuts
 
 | Key | Action |
````
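The zshrc wrapper added in this diff uses a common pattern: save the caller's directory, `cd` into the project, activate its venv, run the real binary via `command` (which skips the function's own name), then return. A minimal sketch of that pattern, with an illustrative function name `run_in_project` and a `/tmp/demo-project` path that are not from the commit:

```shell
# Sketch of the wrapper pattern: save $PWD, work inside the project
# directory, then restore the caller's directory. The real wrapper
# would also `source .venv/bin/activate` before running the server.
run_in_project() {
  local original_dir="$PWD"
  cd /tmp/demo-project || return 1
  command pwd          # `command` bypasses functions/aliases of the same name
  cd "$original_dir"
}

mkdir -p /tmp/demo-project
cd /tmp
run_in_project         # prints /tmp/demo-project
pwd                    # caller's directory is restored: /tmp
```

One caveat of this design: if the wrapped command fails, the trailing `cd` still runs, but an early `return` (as after a failed `cd`) would leave the caller's directory untouched anyway, since the `cd` only happens inside the function.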

src/efx-face-manager.sh

Lines changed: 14 additions & 14 deletions
```diff
@@ -7,7 +7,7 @@
 # Uses gum for interactive selection
 # https://github.com/charmbracelet/gum
 
-VERSION="0.1.10"
+VERSION="0.1.11"
 
 clear
 
@@ -1276,12 +1276,23 @@ while true; do
     # Fast launch predefined template models
     template_choice=$(gum choose \
         --header "Select a template model to run" \
-        "Qwen3-Coder-30B-A3B-Instruct-8bit" \
-        "NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-8Bit" \
         "GLM-4.7-Flash-8bit" \
+        "NVIDIA-Nemotron-3-Nano-30B-A3B-MLX-8Bit" \
+        "Qwen3-Coder-30B-A3B-Instruct-8bit" \
         "✖ Back")
 
     case "$template_choice" in
+        "GLM-4.7-Flash-8bit")
+            CMD_ARGS=("--model-path" "$MODEL_DIR/GLM-4.7-Flash-8bit")
+            CMD_ARGS+=("--model-type" "lm")
+            CMD_ARGS+=("--reasoning-parser" "glm47_flash")
+            CMD_ARGS+=("--tool-call-parser" "glm4_moe")
+            CMD_ARGS+=("--message-converter" "glm4_moe")
+            CMD_ARGS+=("--debug")
+            CMD_ARGS+=("--port" "8000")
+            CMD_ARGS+=("--host" "0.0.0.0")
+            confirm_and_launch
+            ;;
         "Qwen3-Coder-30B-A3B-Instruct-8bit")
             CMD_ARGS=("--model-path" "$MODEL_DIR/Qwen3-Coder-30B-A3B-Instruct-8bit")
             CMD_ARGS+=("--model-type" "lm")
@@ -1301,17 +1312,6 @@ while true; do
             CMD_ARGS+=("--trust-remote-code")
             confirm_and_launch
             ;;
-        "GLM-4.7-Flash-8bit")
-            CMD_ARGS=("--model-path" "$MODEL_DIR/GLM-4.7-Flash-8bit")
-            CMD_ARGS+=("--model-type" "lm")
-            CMD_ARGS+=("--reasoning-parser" "glm4_moe") # glm47_flash
-            CMD_ARGS+=("--tool-call-parser" "glm4_moe")
-            CMD_ARGS+=("--message-converter" "glm4_moe")
-            CMD_ARGS+=("--debug")
-            CMD_ARGS+=("--port" "8000")
-            CMD_ARGS+=("--host" "0.0.0.0")
-            confirm_and_launch
-            ;;
     esac
     ;;
```
13171317
