@@ -32,15 +32,45 @@ object ModelList {
3232 AppModel (id = " qwen2.5-0.5b-instruct-q6_k" , name = " Qwen 2.5 0.5B Instruct Q6_K" ,
3333 url = " https://huggingface.co/Triangle104/Qwen2.5-0.5B-Instruct-Q6_K-GGUF/resolve/main/qwen2.5-0.5b-instruct-q6_k.gguf" ,
3434 framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
35+ memoryRequirement = 600_000_000 , supportsLoraAdapters = true ),
36+ AppModel (id = " qwen2.5-1.5b-instruct-q4_k_m" , name = " Qwen 2.5 1.5B Instruct Q4_K_M" ,
37+ url = " https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct-GGUF/resolve/main/qwen2.5-1.5b-instruct-q4_k_m.gguf" ,
38+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
39+ memoryRequirement = 2_500_000_000 ),
40+ // Qwen3 models
41+ AppModel (id = " qwen3-0.6b-q4_k_m" , name = " Qwen3 0.6B Q4_K_M" ,
42+ url = " https://huggingface.co/unsloth/Qwen3-0.6B-GGUF/resolve/main/Qwen3-0.6B-Q4_K_M.gguf" ,
43+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
44+ memoryRequirement = 500_000_000 ),
45+ AppModel (id = " qwen3-1.7b-q4_k_m" , name = " Qwen3 1.7B Q4_K_M" ,
46+ url = " https://huggingface.co/unsloth/Qwen3-1.7B-GGUF/resolve/main/Qwen3-1.7B-Q4_K_M.gguf" ,
47+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
48+ memoryRequirement = 1_200_000_000 ),
49+ AppModel (id = " qwen3-4b-q4_k_m" , name = " Qwen3 4B Q4_K_M" ,
50+ url = " https://huggingface.co/unsloth/Qwen3-4B-GGUF/resolve/main/Qwen3-4B-Q4_K_M.gguf" ,
51+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
52+ memoryRequirement = 2_800_000_000 ),
53+ // Qwen3.5 models
54+ AppModel (id = " qwen3.5-0.8b-q4_k_m" , name = " Qwen3.5 0.8B Q4_K_M" ,
55+ url = " https://huggingface.co/unsloth/Qwen3.5-0.8B-GGUF/resolve/main/Qwen3.5-0.8B-Q4_K_M.gguf" ,
56+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
3557 memoryRequirement = 600_000_000 ),
58+ AppModel (id = " qwen3.5-2b-q4_k_m" , name = " Qwen3.5 2B Q4_K_M" ,
59+ url = " https://huggingface.co/unsloth/Qwen3.5-2B-GGUF/resolve/main/Qwen3.5-2B-Q4_K_M.gguf" ,
60+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
61+ memoryRequirement = 1_500_000_000 ),
62+ AppModel (id = " qwen3.5-4b-q4_k_m" , name = " Qwen3.5 4B Q4_K_M" ,
63+ url = " https://huggingface.co/unsloth/Qwen3.5-4B-GGUF/resolve/main/Qwen3.5-4B-Q4_K_M.gguf" ,
64+ framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
65+ memoryRequirement = 2_800_000_000 ),
3666 AppModel (id = " lfm2-350m-q4_k_m" , name = " LiquidAI LFM2 350M Q4_K_M" ,
3767 url = " https://huggingface.co/LiquidAI/LFM2-350M-GGUF/resolve/main/LFM2-350M-Q4_K_M.gguf" ,
3868 framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
39- memoryRequirement = 250_000_000 , supportsLoraAdapters = true ),
69+ memoryRequirement = 250_000_000 ),
4070 AppModel (id = " lfm2-350m-q8_0" , name = " LiquidAI LFM2 350M Q8_0" ,
4171 url = " https://huggingface.co/LiquidAI/LFM2-350M-GGUF/resolve/main/LFM2-350M-Q8_0.gguf" ,
4272 framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
43- memoryRequirement = 400_000_000 , supportsLoraAdapters = true ),
73+ memoryRequirement = 400_000_000 ),
4474 AppModel (id = " lfm2-1.2b-tool-q4_k_m" , name = " LiquidAI LFM2 1.2B Tool Q4_K_M" ,
4575 url = " https://huggingface.co/LiquidAI/LFM2-1.2B-Tool-GGUF/resolve/main/LFM2-1.2B-Tool-Q4_K_M.gguf" ,
4676 framework = InferenceFramework .LLAMA_CPP , category = ModelCategory .LANGUAGE ,
@@ -81,46 +111,46 @@ object ModelList {
81111 )),
82112 )
83113
84- // LoRA Adapters (from Void2377/Qwen on HuggingFace — real standalone LoRA GGUF files)
114+ // LoRA Adapters
85115 private val loraAdapters = listOf (
86116 LoraAdapterCatalogEntry (
87- id = " chat -assistant-lora" ,
88- name = " Chat Assistant" ,
89- description = " Enhances conversational chat ability " ,
90- downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/chat_assistant-lora -Q8_0.gguf" ,
91- filename = " chat_assistant-lora -Q8_0.gguf" ,
92- compatibleModelIds = listOf (" lfm2-350m-q4_k_m " , " lfm2-350m-q8_0 " ),
93- fileSize = 690_176 ,
117+ id = " code -assistant-lora" ,
118+ name = " Code Assistant" ,
119+ description = " Enhances code generation and programming assistance " ,
120+ downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/code-assistant -Q8_0.gguf" ,
121+ filename = " code-assistant -Q8_0.gguf" ,
122+ compatibleModelIds = listOf (" qwen2.5-0.5b-instruct-q6_k " ),
123+ fileSize = 765_952 ,
94124 defaultScale = 1.0f ,
95125 ),
96126 LoraAdapterCatalogEntry (
97- id = " summarizer -lora" ,
98- name = " Summarizer " ,
99- description = " Specialized for text summarization tasks " ,
100- downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/summarizer-lora -Q8_0.gguf" ,
101- filename = " summarizer-lora -Q8_0.gguf" ,
102- compatibleModelIds = listOf (" lfm2-350m-q4_k_m " , " lfm2-350m-q8_0 " ),
103- fileSize = 690_176 ,
127+ id = " reasoning-logic -lora" ,
128+ name = " Reasoning Logic " ,
129+ description = " Improves logical reasoning and step-by-step problem solving " ,
130+ downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/reasoning-logic -Q8_0.gguf" ,
131+ filename = " reasoning-logic -Q8_0.gguf" ,
132+ compatibleModelIds = listOf (" qwen2.5-0.5b-instruct-q6_k " ),
133+ fileSize = 765_952 ,
104134 defaultScale = 1.0f ,
105135 ),
106136 LoraAdapterCatalogEntry (
107- id = " translator -lora" ,
108- name = " Translator " ,
109- description = " Improves translation between languages " ,
110- downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/translator-lora -Q8_0.gguf" ,
111- filename = " translator-lora -Q8_0.gguf" ,
112- compatibleModelIds = listOf (" lfm2-350m-q4_k_m " , " lfm2-350m-q8_0 " ),
113- fileSize = 690_176 ,
137+ id = " medical-qa -lora" ,
138+ name = " Medical QA " ,
139+ description = " Enhances medical question answering and health-related responses " ,
140+ downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/medical-qa -Q8_0.gguf" ,
141+ filename = " medical-qa -Q8_0.gguf" ,
142+ compatibleModelIds = listOf (" qwen2.5-0.5b-instruct-q6_k " ),
143+ fileSize = 765_952 ,
114144 defaultScale = 1.0f ,
115145 ),
116146 LoraAdapterCatalogEntry (
117- id = " sentiment -lora" ,
118- name = " Sentiment Analysis " ,
119- description = " Fine-tuned for sentiment analysis tasks " ,
120- downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/sentiment-lora -Q8_0.gguf" ,
121- filename = " sentiment-lora -Q8_0.gguf" ,
122- compatibleModelIds = listOf (" lfm2-350m-q4_k_m " , " lfm2-350m-q8_0 " ),
123- fileSize = 690_176 ,
147+ id = " creative-writing -lora" ,
148+ name = " Creative Writing " ,
149+ description = " Improves creative writing, storytelling, and literary style " ,
150+ downloadUrl = " https://huggingface.co/Void2377/Qwen/resolve/main/lora/creative-writing -Q8_0.gguf" ,
151+ filename = " creative-writing -Q8_0.gguf" ,
152+ compatibleModelIds = listOf (" qwen2.5-0.5b-instruct-q6_k " ),
153+ fileSize = 765_952 ,
124154 defaultScale = 1.0f ,
125155 ),
126156 )
0 commit comments