From 84a6b2229ffc608b1c3b6f1683fb8079d8473d62 Mon Sep 17 00:00:00 2001 From: Chili Palmer Date: Sat, 21 Mar 2026 16:08:40 +0100 Subject: [PATCH] added new story model with 12B size --- AGENTS.md | 1 + MLXServer/Models/ModelConfig.swift | 10 ++++++++++ README.md | 1 + 3 files changed, 12 insertions(+) diff --git a/AGENTS.md b/AGENTS.md index d161350..946c752 100644 --- a/AGENTS.md +++ b/AGENTS.md @@ -55,6 +55,7 @@ open "build/Debug/MLX Server.app" | `qwen` | `mlx-community/Qwen3.5-4B-MLX-4bit` | Vision + thinking mode + tool use via `` tags (256k context) | | `qwen3.5-0.8b` | `mlx-community/Qwen3.5-0.8B-4bit` | Vision + thinking mode + tool use via `` tags (256k context) | | `qwen3.5-9b` | `mlx-community/Qwen3.5-9B-4bit` | Vision + thinking mode + tool use via `` tags (256k context) | +| `violet-lotus` | `hobaratio/MN-Violet-Lotus-12B-mlx-4Bit` | Text-only Mistral-based model (32k context) | Any model in MLX format on HuggingFace can be added — no restriction on uploader or architecture. diff --git a/MLXServer/Models/ModelConfig.swift b/MLXServer/Models/ModelConfig.swift index 841c1e9..49da622 100644 --- a/MLXServer/Models/ModelConfig.swift +++ b/MLXServer/Models/ModelConfig.swift @@ -69,6 +69,16 @@ struct ModelConfig: Identifiable, Hashable { supportsTools: false, defaultGenerationSettings: .roleplayDefault ), + ModelConfig( + id: "violet-lotus", + repoId: "hobaratio/MN-Violet-Lotus-12B-mlx-4Bit", + displayName: "Violet Lotus 12B", + contextLength: 32_768, + loaderKind: .llm, + supportsImages: false, + supportsTools: false, + defaultGenerationSettings: .roleplayDefault + ), ] static let `default` = availableModels[0] diff --git a/README.md b/README.md index 6186ab6..2cf06ed 100644 --- a/README.md +++ b/README.md @@ -11,6 +11,7 @@ Native macOS app for running local LLMs on Apple Silicon via [MLX](https://githu | `qwen3.5-0.8b` | `mlx-community/Qwen3.5-0.8B-4bit` | 256k | `VLMModelFactory` | Vision, thinking mode, tool use (`` tags) | | `qwen3.5-9b` | `mlx-community/Qwen3.5-9B-4bit` | 256k | `VLMModelFactory` | Vision, thinking mode, tool use (`` tags) | | `stheno` | `synk/L3-8B-Stheno-v3.2-MLX` | 8k | `LLMModelFactory` | Text-only, llama-based | +| `violet-lotus` | `hobaratio/MN-Violet-Lotus-12B-mlx-4Bit` | 32k | `LLMModelFactory` | Text-only, Mistral-based | Any model in MLX format on HuggingFace can be added — there is no restriction on uploader or architecture.