Support for BigTrans, Minotaur, Robin, and Vicuna v1.3 models (#451)

* Feature: add Vicuna-v1.3-7B and Vicuna-v1.3-13B

* Feature: add BigTrans-13B

* Feature: add robin,minotour,chronos-hermes,vicuna,trans

* Feature: add robin,minotour,chronos-hermes,vicuna,trans

* Docs: update model max ram required

* Docs: update model max ram required

* Feature: add more quants q2_k,q3_K_L,q4_1,q4_K_M,q8_0 on schema.json

* Fix: missing emojis and typo vicuna models q3_K_L

* Fix: minotaur

* Fix: minotaur

* Fix: schame.json enum k-quants

* Fix: schame.json enum k-quants

---------

Co-authored-by: pabl-o-ce <cye@poscye.com>
This commit is contained in:
PΔBLØ ᄃΞ 2023-06-19 21:16:41 +00:00 committed by GitHub
parent 998e13da37
commit c6c02271e0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 451 additions and 9 deletions

View File

@ -65,6 +65,8 @@ We currently support the following models:
- Alpaca 🦙
- Alpaca-LoRA-65B
- GPT4-Alpaca-LoRA-30B
- BigTrans 🗺
- BigTrans-13B
- Chronos 🌑
- Chronos-13B
- Chronos-33B
@ -84,10 +86,17 @@ We currently support the following models:
- Llama-Supercot-30B
- Lazarus 💀
- Lazarus-30B
- Minotour 🐃
- Minotaur-15B
- Nous 🧠
- Nous-Hermes-13B
- OpenAssistant 🎙️
- OpenAssistant-30B
- Robin 🏹
- Robin-7B
- Robin-13B
- Robin-33B
- Robin-65B
- Samantha 👩
- Samantha-7B
- Samantha-13B
@ -104,6 +113,8 @@ We currently support the following models:
- Vicuna-v1.1-13B
- VicUnlocked-30B
- VicUnlocked-65B
- Vicuna-v1.3-7B
- Vicuna-v1.3-13B
- Wizard 🧙
- Wizard-Mega-13B
- Wizard-Vicuna-Uncensored-7B
@ -124,14 +135,44 @@ docker cp ./my_weight.bin serge:/usr/src/app/weights/
LLaMA will crash if you don't have enough available memory for the model:
| Model | RAM Required |
|----------|-----------------|
| 7B | 4.5GB |
| 7B-q6_K | 8.03GB |
| 13B | 12GB |
| 13B-q6_K | 13.18GB |
| 30B | 20GB |
| 30B-q6_K | 29.19GB |
| Model | Max RAM Required |
|-------------|------------------|
| 7B | 4.5GB |
| 7B-q2_K | 5.37GB |
| 7B-q3_K_L | 6.10GB |
| 7B-q4_1 | 6.71GB |
| 7B-q4_K_M | 6.58GB |
| 7B-q5_1 | 7.56GB |
| 7B-q5_K_M | 7.28GB |
| 7B-q6_K | 8.03GB |
| 7B-q8_0 | 9.66GB |
| 13B | 12GB |
| 13B-q2_K | 8.01GB |
| 13B-q3_K_L | 9.43GB |
| 13B-q4_1 | 10.64GB |
| 13B-q4_K_M | 10.37GB |
| 13B-q5_1 | 12.26GB |
| 13B-q5_K_M | 11.73GB |
| 13B-q6_K | 13.18GB |
| 13B-q8_0 | 16.33GB |
| 33B | 20GB |
| 33B-q2_K | 16.21GB |
| 33B-q3_K_L | 19.78GB |
| 33B-q4_1 | 22.83GB |
| 33B-q4_K_M | 22.12GB |
| 33B-q5_1 | 26.90GB |
| 33B-q5_K_M | 25.55GB |
| 33B-q6_K | 29.19GB |
| 33B-q8_0 | 37.06GB |
| 65B | 50GB |
| 65B-q2_K | 29.95GB |
| 65B-q3_K_L | 37.15GB |
| 65B-q4_1 | 43.31GB |
| 65B-q4_K_M | 41.85GB |
| 65B-q5_1 | 51.47GB |
| 65B-q5_K_M | 48.74GB |
| 65B-q6_K | 56.06GB |
| 65B-q8_0 | 71.87GB |
## 💬 Support

View File

@ -66,6 +66,52 @@
"disk_space": 26700000000.0
}
]
},
{
"name": "Chronos-Hermes-13B",
"repo": "TheBloke/chronos-hermes-13B-GGML",
"files": [
{
"name": "q2_K",
"filename": "chronos-hermes-13b.ggmlv3.q2_K.bin",
"disk_space": 55100000000.0
},
{
"name": "q3_K_L",
"filename": "chronos-hermes-13b.ggmlv3.q3_K_L.bin",
"disk_space": 69300000000.0
},
{
"name": "q4_1",
"filename": "chronos-hermes-13b.ggmlv3.q4_1.bin",
"disk_space": 81400000000.0
},
{
"name": "q4_K_M",
"filename": "chronos-hermes-13b.ggmlv3.q4_K_M.bin",
"disk_space": 78700000000.0
},
{
"name": "q5_1",
"filename": "chronos-hermes-13b.ggmlv3.q5_1.bin",
"disk_space": 97600000000.0
},
{
"name": "q5_K_M",
"filename": "chronos-hermes-13b.ggmlv3.q5_K_M.bin",
"disk_space": 92300000000.0
},
{
"name": "q6_K",
"filename": "chronos-hermes-13b.ggmlv3.q6_K.bin",
"disk_space": 10700000000.0
},
{
"name": "q8_0",
"filename": "chronos-hermes-13b.ggmlv3.q8_0.bin",
"disk_space": 13800000000.0
}
]
}
]
},
@ -330,6 +376,98 @@
"disk_space": 58700000000.0
}
]
},
{
"name": "Vicuna-v1.3-7B",
"repo": "TheBloke/vicuna-7B-v1.3-GGML",
"files": [
{
"name": "q2_K",
"filename": "vicuna-7b-v1.3.ggmlv3.q2_K.bin",
"disk_space": 28700000000.0
},
{
"name": "q3_K_L",
"filename": "vicuna-7b-v1.3.ggmlv3.q3_K_L.bin",
"disk_space": 36000000000.0
},
{
"name": "q4_1",
"filename": "vicuna-7b-v1.3.ggmlv3.q4_1.bin",
"disk_space": 42100000000.0
},
{
"name": "q4_K_M",
"filename": "vicuna-7b-v1.3.ggmlv3.q4_K_M.bin",
"disk_space": 40800000000.0
},
{
"name": "q5_1",
"filename": "vicuna-7b-v1.3.ggmlv3.q5_1.bin",
"disk_space": 50600000000.0
},
{
"name": "q5_K_M",
"filename": "vicuna-7b-v1.3.ggmlv3.q5_K_M.bin",
"disk_space": 47800000000.0
},
{
"name": "q6_K",
"filename": "vicuna-7b-v1.3.ggmlv3.q6_K.bin",
"disk_space": 55300000000.0
},
{
"name": "q8_0",
"filename": "vicuna-7b-v1.3.ggmlv3.q8_0.bin",
"disk_space": 71600000000.0
}
]
},
{
"name": "Vicuna-v1.3-13B",
"repo": "TheBloke/vicuna-13b-v1.3-GGML",
"files": [
{
"name": "q2_K",
"filename": "vicuna-13b-v1.3.ggmlv3.q2_K.bin",
"disk_space": 55100000000.0
},
{
"name": "q3_K_L",
"filename": "vicuna-13b-v1.3.ggmlv3.q3_K_L.bin",
"disk_space": 69300000000.0
},
{
"name": "q4_1",
"filename": "vicuna-13b-v1.3.ggmlv3.q4_1.bin",
"disk_space": 81400000000.0
},
{
"name": "q4_K_M",
"filename": "vicuna-13b-v1.3.ggmlv3.q4_K_M.bin",
"disk_space": 78700000000.0
},
{
"name": "q5_1",
"filename": "vicuna-13b-v1.3.ggmlv3.q5_1.bin",
"disk_space": 97600000000.0
},
{
"name": "q5_K_M",
"filename": "vicuna-13b-v1.3.ggmlv3.q5_K_M.bin",
"disk_space": 92300000000.0
},
{
"name": "q6_K",
"filename": "vicuna-13b-v1.3.ggmlv3.q6_K.bin",
"disk_space": 10700000000.0
},
{
"name": "q8_0",
"filename": "vicuna-13b-v1.3.ggmlv3.q8_0.bin",
"disk_space": 13800000000.0
}
]
}
]
},
@ -484,6 +622,185 @@
}
]
},
{
"name": "Robin",
"models": [
{
"name": "Robin-7B",
"repo": "TheBloke/robin-7B-v2-GGML",
"files": [
{
"name": "q2_K",
"filename": "robin-7b.ggmlv3.q2_K.bin",
"disk_space": 28700000000.0
},
{
"name": "q3_K_L",
"filename": "robin-7b.ggmlv3.q3_K_L.bin",
"disk_space": 36000000000.0
},
{
"name": "q4_1",
"filename": "robin-7b.ggmlv3.q4_1.bin",
"disk_space": 42100000000.0
},
{
"name": "q4_K_M",
"filename": "robin-7b.ggmlv3.q4_K_M.bin",
"disk_space": 40800000000.0
},
{
"name": "q5_1",
"filename": "robin-7b.ggmlv3.q5_1.bin",
"disk_space": 50600000000.0
},
{
"name": "q5_K_M",
"filename": "robin-7b.ggmlv3.q5_K_M.bin",
"disk_space": 47800000000.0
},
{
"name": "q6_K",
"filename": "robin-7b.ggmlv3.q6_K.bin",
"disk_space": 55300000000.0
},
{
"name": "q8_0",
"filename": "robin-7b.ggmlv3.q8_0.bin",
"disk_space": 71600000000.0
}
]
},
{
"name": "Robin-13B",
"repo": "TheBloke/robin-13B-v2-GGML",
"files": [
{
"name": "q2_K",
"filename": "robin-13b.ggmlv3.q2_K.bin",
"disk_space": 55100000000.0
},
{
"name": "q3_K_L",
"filename": "robin-13b.ggmlv3.q3_K_L.bin",
"disk_space": 69300000000.0
},
{
"name": "q4_1",
"filename": "robin-13b.ggmlv3.q4_1.bin",
"disk_space": 81400000000.0
},
{
"name": "q4_K_M",
"filename": "robin-13b.ggmlv3.q4_K_M.bin",
"disk_space": 78700000000.0
},
{
"name": "q5_1",
"filename": "robin-13b.ggmlv3.q5_1.bin",
"disk_space": 97600000000.0
},
{
"name": "q5_K_M",
"filename": "robin-13b.ggmlv3.q5_K_M.bin",
"disk_space": 92300000000.0
},
{
"name": "q6_K",
"filename": "robin-13b.ggmlv3.q6_K.bin",
"disk_space": 10700000000.0
},
{
"name": "q8_0",
"filename": "robin-13b.ggmlv3.q8_0.bin",
"disk_space": 13800000000.0
}
]
},
{
"name": "Robin-33B",
"repo": "TheBloke/robin-33B-v2-GGML",
"files": [
{
"name": "q2_K",
"filename": "robin-33b.ggmlv3.q2_K.bin",
"disk_space": 13700000000.0
},
{
"name": "q3_K_L",
"filename": "robin-33b.ggmlv3.q3_K_L.bin",
"disk_space": 17300000000.0
},
{
"name": "q4_1",
"filename": "robin-33b.ggmlv3.q4_1.bin",
"disk_space": 20300000000.0
},
{
"name": "q4_K_M",
"filename": "robin-33b.ggmlv3.q4_K_M.bin",
"disk_space": 19600000000.0
},
{
"name": "q5_1",
"filename": "robin-33b.ggmlv3.q5_1.bin",
"disk_space": 24400000000.0
},
{
"name": "q5_K_M",
"filename": "robin-33b.ggmlv3.q5_K_M.bin",
"disk_space": 23000000000.0
},
{
"name": "q6_K",
"filename": "robin-33b.ggmlv3.q6_K.bin",
"disk_space": 26700000000.0
},
{
"name": "q8_0",
"filename": "robin-33b.ggmlv3.q8_0.bin",
"disk_space": 34600000000.0
}
]
},
{
"name": "Robin-65B",
"repo": "TheBloke/robin-65B-v2-GGML",
"files": [
{
"name": "q2_K",
"filename": "robin-65b.ggmlv3.q2_K.bin",
"disk_space": 27500000000.0
},
{
"name": "q3_K_L",
"filename": "robin-65b.ggmlv3.q3_K_L.bin",
"disk_space": 34600000000.0
},
{
"name": "q4_1",
"filename": "robin-65b.ggmlv3.q4_1.bin",
"disk_space": 40800000000.0
},
{
"name": "q4_K_M",
"filename": "robin-65b.ggmlv3.q4_K_M.bin",
"disk_space": 39300000000.0
},
{
"name": "q5_1",
"filename": "robin-65b.ggmlv3.q5_1.bin",
"disk_space": 49000000000.0
},
{
"name": "q5_K_M",
"filename": "robin-65b.ggmlv3.q5_K_M.bin",
"disk_space": 46200000000.0
}
]
}
]
},
{
"name": "misc",
"models": [
@ -541,6 +858,83 @@
"disk_space": 26700000000.0
}
]
},
{
"name": "BigTrans-13B",
"repo": "TheBloke/BigTrans-13B-GGML",
"files": [
{
"name": "q2_K",
"filename": "bigtrans-13b.ggmlv3.q2_K.bin",
"disk_space": 56400000000.0
},
{
"name": "q3_K_L",
"filename": "bigtrans-13b.ggmlv3.q3_K_L.bin",
"disk_space": 70700000000.0
},
{
"name": "q4_1",
"filename": "bigtrans-13b.ggmlv3.q4_1.bin",
"disk_space": 82800000000.0
},
{
"name": "q4_K_M",
"filename": "bigtrans-13b.ggmlv3.q4_K_M.bin",
"disk_space": 80200000000.0
},
{
"name": "q5_1",
"filename": "bigtrans-13b.ggmlv3.q5_1.bin",
"disk_space": 99300000000.0
},
{
"name": "q5_K_M",
"filename": "bigtrans-13b.ggmlv3.q5_K_M.bin",
"disk_space": 94000000000.0
},
{
"name": "q6_K",
"filename": "bigtrans-13b.ggmlv3.q6_K.bin",
"disk_space": 10900000000.0
},
{
"name": "q8_0",
"filename": "bigtrans-13b.ggmlv3.q8_0.bin",
"disk_space": 14100000000.0
}
]
},
{
"name": "Minotaur-15B",
"repo": "TheBloke/minotaur-15B-GGML",
"files": [
{
"name": "q4_0",
"filename": "minotaur-15b.ggmlv3.q4_0.bin",
"disk_space": 10700000000.0
},
{
"name": "q4_1",
"filename": "minotaur-15b.ggmlv3.q4_1.bin",
"disk_space": 11900000000.0
},
{
"name": "q5_0",
"filename": "minotaur-15b.ggmlv3.q5_0.bin",
"disk_space": 13100000000.0
},
{
"name": "q5_1",
"filename": "minotaur-15b.ggmlv3.q5_1.bin",
"disk_space": 14300000000.0
},
{
"name": "q8_0",
"filename": "minotaur-15b.ggmlv3.q8_0.bin",
"disk_space": 20100000000.0
}
]
}
]
}

View File

@ -73,9 +73,16 @@
"Name": {
"type": "string",
"enum": [
"q2_K",
"q3_K_L",
"q4_0",
"q4_1",
"q4_K_M",
"q5_0",
"q5_1",
"q5_K_M",
"q6_K",
"q5_K_M"
"q8_0"
],
"title": "Name"
}