Add support for Alfred LLM (#936)
* Update models.json: add support for Alfred 40B (supports 5 languages)
* Update README.md: add support for Alfred 40B (supports 5 languages)
This commit is contained in:
parent
bc10144ed5
commit
c23402153d
@ -57,9 +57,10 @@ Instructions for setting up Serge on Kubernetes can be found in the [wiki](https
|
||||
|
||||
| Category | Models |
|
||||
|:-------------:|:-------|
|
||||
| **Alfred** | 40B |
|
||||
| **CodeLLaMA** | 7B, 13B |
|
||||
| **Falcon** | 7B, 7B-Instruct, 40B, 40B-Instruct |
|
||||
| **LLaMA** | 7B, 13B, 70B |
|
||||
| **LLaMA 2** | 7B, 13B, 70B |
|
||||
| **Med42** | 70B |
|
||||
| **Meditron** | 7B, 70B |
|
||||
| **Mistral** | 7B, 7B-Instruct, 7B-OpenOrca |
|
||||
|
||||
@ -1,4 +1,20 @@
|
||||
[
|
||||
{
|
||||
"name": "Alfred",
|
||||
"models": [
|
||||
{
|
||||
"name": "Alfred-40B",
|
||||
"repo": "TheBloke/alfred-40B-1023-GGUF",
|
||||
"files": [
|
||||
{
|
||||
"name": "q4_K_M",
|
||||
"filename": "alfred-40b-1023.Q4_K_M.gguf",
|
||||
"disk_space": 25500000000.0
|
||||
}
|
||||
]
|
||||
}
|
||||
]
|
||||
},
|
||||
{
|
||||
"name": "PsyMedRP",
|
||||
"models": [
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user