update models
All checks were successful
Build, Push and Redeploy Docker Image / build-and-push (push) Successful in 5m18s
All checks were successful
Build, Push and Redeploy Docker Image / build-and-push (push) Successful in 5m18s
This commit is contained in:
@@ -15,25 +15,9 @@ model_configs = {
|
||||
"Qwen2.5-3B-Instruct-w8w8": {"filename": "Qwen2.5-3B-Instruct-w8w8.rkllm"}
|
||||
}
|
||||
},
|
||||
"DeepSeek-R1-Distill-Qwen-1.5B_FP16_RK3588": {
|
||||
"Qwen3-4B-Instruct-2507-F16": {
|
||||
"base_config": {
|
||||
"st_model_id": "Qwen/Qwen2.5-14B-Instruct",
|
||||
"max_context_len": 128000,
|
||||
"max_new_tokens": 8192,
|
||||
"top_k": 5,
|
||||
"top_p": 0.95,
|
||||
"temperature": 0.6,
|
||||
"repeat_penalty": 1.00,
|
||||
"frequency_penalty": 0.2,
|
||||
"system_prompt": "You are Deepseek. You are a helpful assistant."
|
||||
},
|
||||
"models": {
|
||||
"DeepSeek-R1-Distill-Qwen-1.5B_FP16_RK3588": {"filename": "DeepSeek-R1-Distill-Qwen-1.5B_FP16_RK3588.rkllm"}
|
||||
}
|
||||
},
|
||||
"Qwen2.5-Coder-3B-Instruct-w8w8": {
|
||||
"base_config": {
|
||||
"st_model_id": "Qwen/Qwen2.5-14B-Instruct",
|
||||
"st_model_id": "unsloth/Qwen3-4B-Instruct-2507-GGUF",
|
||||
"max_context_len": 128000,
|
||||
"max_new_tokens": 8192,
|
||||
"top_k": 5,
|
||||
@@ -44,7 +28,7 @@ model_configs = {
|
||||
"system_prompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant"
|
||||
},
|
||||
"models": {
|
||||
"Qwen2.5-Coder-3B-Instruct-w8w8": {"filename": "Qwen2.5-Coder-3B-Instruct-w8w8.rkllm"}
|
||||
"Qwen3-4B-Instruct-2507-F16": {"filename": "Qwen3-4B-Instruct-2507-F16.rkllm"}
|
||||
}
|
||||
}
|
||||
# "LLaMA-Mesh": {
|
||||
|
||||
Reference in New Issue
Block a user