forked from PiDanShouRouZhouXD/Sakura_Launcher_GUI
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
5 changed files
with
210 additions
and
205 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,111 +1,143 @@ | ||
[ | ||
{ | ||
"repo": "GalTransl-7B-v2.6", | ||
"filename": "GalTransl-7B-v2.6-IQ4_XS.gguf", | ||
"sha256": "f1095c715bd37d6df1f674e86382723fe1fe45c3b4f9c80a4452bcf9128d3eca", | ||
"minimal_gpu_memory_gib": 8, | ||
"size": 4.29, | ||
"recommended_np": { | ||
"8": 2, | ||
"10": 4, | ||
"12": 12, | ||
"16": 16, | ||
"24": 16 | ||
{ | ||
"llamacpp": [ | ||
{ | ||
"repo": "ggerganov/llama.cpp/llama.cpp/releases/download/b3923", | ||
"filename": "llama-b3923-bin-win-cuda-cu12.2.0-x64.zip", | ||
"version": "b3923-CUDA", | ||
"gpu": "Nvidia独显", | ||
"require_cuda": true | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-7B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 4096, | ||
"num_attention_heads": 32, | ||
"num_key_value_heads": 32, | ||
"num_hidden_layers": 32, | ||
"parameters": 7721324544.0 | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2.5-v1.0-GGUF", | ||
"filename": "sakura-14b-qwen2.5-v1.0-iq4xs.gguf", | ||
"sha256": "34af88f99c113418d0665d3ceede767c9a12040c9e7c4bb5e87cdb1b1e06e94a", | ||
"minimal_gpu_memory_gib": 10, | ||
"size": 8.19, | ||
"recommended_np": { | ||
"10": 4, | ||
"12": 12, | ||
"16": 16, | ||
"24": 16 | ||
{ | ||
"repo": "PiDanShouRouZhouXD/Sakura_Launcher_GUI/releases/download/v0.0.3-alpha", | ||
"filename": "llama-b3384-bin-win-rocm-avx2-x64.zip", | ||
"version": "b3384-ROCm", | ||
"gpu": "部分AMD独显", | ||
"require_cuda": false | ||
}, | ||
"base_model_hf": "Qwen/Qwen2.5-14B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 8, | ||
"num_hidden_layers": 48, | ||
"parameters": 14770033664.0 | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2.5-v1.0-GGUF", | ||
"filename": "sakura-14b-qwen2.5-v1.0-q4km.gguf", | ||
"sha256": "c87697cd9c7898464426cb7a1ec5e220755affaa08096766e8d20de1853c2063", | ||
"minimal_gpu_memory_gib": 10, | ||
"size": 8.99, | ||
"recommended_np": { | ||
"10": 1, | ||
"12": 6, | ||
"16": 16, | ||
"24": 16 | ||
{ | ||
"repo": "PiDanShouRouZhouXD/Sakura_Launcher_GUI/releases/download/v0.0.3-alpha", | ||
"filename": "llama-b3534-bin-win-rocm-avx512-x64.zip", | ||
"version": "b3534-ROCm-780m", | ||
"gpu": "部分AMD核显", | ||
"require_cuda": false | ||
}, | ||
"base_model_hf": "Qwen/Qwen2.5-14B", | ||
"bpw": 4.85, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 8, | ||
"num_hidden_layers": 48, | ||
"parameters": 14770033664.0 | ||
{ | ||
"repo": "ggerganov/llama.cpp/llama.cpp/releases/download/b3923", | ||
"filename": "llama-b3923-bin-win-vulkan-x64.zip", | ||
"version": "b3923-Vulkan", | ||
"gpu": "通用,不推荐", | ||
"require_cuda": false | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2beta-v0.9.2-GGUF", | ||
"filename": "sakura-14b-qwen2beta-v0.9.2-iq4xs.gguf", | ||
"sha256": "254a7e97e5e2a5daa371145e55bb2b0a0a789615dab2d4316189ba089a3ced67", | ||
"minimal_gpu_memory_gib": 12, | ||
"size": 7.91, | ||
"recommended_np": { | ||
"12": 1, | ||
"16": 6, | ||
"24": 8 | ||
], | ||
"sakura": [ | ||
{ | ||
"repo": "GalTransl-7B-v2.6", | ||
"filename": "GalTransl-7B-v2.6-IQ4_XS.gguf", | ||
"sha256": "f1095c715bd37d6df1f674e86382723fe1fe45c3b4f9c80a4452bcf9128d3eca", | ||
"minimal_gpu_memory_gib": 8, | ||
"size": 4.29, | ||
"recommended_np": { | ||
"8": 2, | ||
"10": 4, | ||
"12": 12, | ||
"16": 16, | ||
"24": 16 | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-7B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 4096, | ||
"num_attention_heads": 32, | ||
"num_key_value_heads": 32, | ||
"num_hidden_layers": 32, | ||
"parameters": 7721324544.0 | ||
} | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-14B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 40, | ||
"num_hidden_layers": 40, | ||
"parameters": 14167290880.0 | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2beta-v0.9.2-GGUF", | ||
"filename": "sakura-14b-qwen2beta-v0.9.2-q4km.gguf", | ||
"sha256": "8bae1ae35b7327fa7c3a8f3ae495b81a071847d560837de2025e1554364001a5", | ||
"minimal_gpu_memory_gib": 12, | ||
"size": 9.19, | ||
"recommended_np": { | ||
"12": 1, | ||
"16": 6, | ||
"24": 8 | ||
{ | ||
"repo": "Sakura-14B-Qwen2.5-v1.0-GGUF", | ||
"filename": "sakura-14b-qwen2.5-v1.0-iq4xs.gguf", | ||
"sha256": "34af88f99c113418d0665d3ceede767c9a12040c9e7c4bb5e87cdb1b1e06e94a", | ||
"minimal_gpu_memory_gib": 10, | ||
"size": 8.19, | ||
"recommended_np": { | ||
"10": 4, | ||
"12": 12, | ||
"16": 16, | ||
"24": 16 | ||
}, | ||
"base_model_hf": "Qwen/Qwen2.5-14B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 8, | ||
"num_hidden_layers": 48, | ||
"parameters": 14770033664.0 | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2.5-v1.0-GGUF", | ||
"filename": "sakura-14b-qwen2.5-v1.0-q4km.gguf", | ||
"sha256": "c87697cd9c7898464426cb7a1ec5e220755affaa08096766e8d20de1853c2063", | ||
"minimal_gpu_memory_gib": 10, | ||
"size": 8.99, | ||
"recommended_np": { | ||
"10": 1, | ||
"12": 6, | ||
"16": 16, | ||
"24": 16 | ||
}, | ||
"base_model_hf": "Qwen/Qwen2.5-14B", | ||
"bpw": 4.85, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 8, | ||
"num_hidden_layers": 48, | ||
"parameters": 14770033664.0 | ||
} | ||
}, | ||
{ | ||
"repo": "Sakura-14B-Qwen2beta-v0.9.2-GGUF", | ||
"filename": "sakura-14b-qwen2beta-v0.9.2-iq4xs.gguf", | ||
"sha256": "254a7e97e5e2a5daa371145e55bb2b0a0a789615dab2d4316189ba089a3ced67", | ||
"minimal_gpu_memory_gib": 12, | ||
"size": 7.91, | ||
"recommended_np": { | ||
"12": 1, | ||
"16": 6, | ||
"24": 8 | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-14B", | ||
"bpw": 4.25, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 40, | ||
"num_hidden_layers": 40, | ||
"parameters": 14167290880.0 | ||
} | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-14B", | ||
"bpw": 4.85, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 40, | ||
"num_hidden_layers": 40, | ||
"parameters": 14167290880.0 | ||
{ | ||
"repo": "Sakura-14B-Qwen2beta-v0.9.2-GGUF", | ||
"filename": "sakura-14b-qwen2beta-v0.9.2-q4km.gguf", | ||
"sha256": "8bae1ae35b7327fa7c3a8f3ae495b81a071847d560837de2025e1554364001a5", | ||
"minimal_gpu_memory_gib": 12, | ||
"size": 9.19, | ||
"recommended_np": { | ||
"12": 1, | ||
"16": 6, | ||
"24": 8 | ||
}, | ||
"base_model_hf": "Qwen/Qwen1.5-14B", | ||
"bpw": 4.85, | ||
"config_cache": { | ||
"hidden_size": 5120, | ||
"num_attention_heads": 40, | ||
"num_key_value_heads": 40, | ||
"num_hidden_layers": 40, | ||
"parameters": 14167290880.0 | ||
} | ||
} | ||
} | ||
] | ||
] | ||
} |
Oops, something went wrong.