From e2c2cebf7d44da1ba7c9447fb982dc34056ccef5 Mon Sep 17 00:00:00 2001 From: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> Date: Thu, 7 Dec 2023 00:38:40 -0500 Subject: [PATCH 1/6] Update README.md --- README.md | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index 91e2512..0e77870 100644 --- a/README.md +++ b/README.md @@ -74,11 +74,7 @@ Instructions for setting up Serge on Kubernetes can be found in the [wiki](https | **Vicuna** | 7B-v1.5, 13B-v1.5 | | **Zephyr** | 7B-Alpha, 7B-Beta | -Additional weights can be added to the `serge_weights` volume using `docker cp`: - -```bash -docker cp ./my_weight.bin serge:/usr/src/app/weights/ -``` +Additional models can be requested by opening a GitHub issue. ## ⚠️ Memory Usage @@ -104,5 +100,5 @@ To run Serge in development mode: ```bash git clone https://github.com/serge-chat/serge.git cd serge/ -docker compose -f docker-compose.dev.yml up -d --build +docker compose -f docker-compose.dev.yml up --build ``` From a04de5b170a5bb11d5fa3cdb0058fa1ddf58e1f1 Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Thu, 7 Dec 2023 08:30:52 -0500 Subject: [PATCH 2/6] Bump actions/setup-python from 4 to 5 (#955) Bumps [actions/setup-python](https://github.com/actions/setup-python) from 4 to 5. - [Release notes](https://github.com/actions/setup-python/releases) - [Commits](https://github.com/actions/setup-python/compare/v4...v5) --- updated-dependencies: - dependency-name: actions/setup-python dependency-type: direct:production update-type: version-update:semver-major ... Signed-off-by: dependabot[bot] Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> --- .github/workflows/ci.yml | 4 ++-- .github/workflows/helm-test.yml | 2 +- .github/workflows/model-check.yml | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index e809509..394909c 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -49,7 +49,7 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v4 - - uses: actions/setup-python@v4 + - uses: actions/setup-python@v5 with: python-version: "3.11" - name: Install dependencies with poetry @@ -76,7 +76,7 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v4 - - uses: actions/setup-python@v4 + - uses: actions/setup-python@v5 with: python-version: "3.11" - name: Run ruff check diff --git a/.github/workflows/helm-test.yml b/.github/workflows/helm-test.yml index 0a2949b..c3fdde7 100644 --- a/.github/workflows/helm-test.yml +++ b/.github/workflows/helm-test.yml @@ -41,7 +41,7 @@ jobs: with: version: v3.12.3 - - uses: actions/setup-python@v4 + - uses: actions/setup-python@v5 with: python-version: '3.10' check-latest: true diff --git a/.github/workflows/model-check.yml b/.github/workflows/model-check.yml index df83848..b590d57 100644 --- a/.github/workflows/model-check.yml +++ b/.github/workflows/model-check.yml @@ -34,7 +34,7 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v4 - - uses: actions/setup-python@v4 + - uses: actions/setup-python@v5 with: python-version: "3.11" - name: Install dependencies with poetry From 005177a51290fb286b57b514717ac2852e0e9a53 Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Thu, 7 Dec 2023 08:31:08 -0500 Subject: [PATCH 3/6] Bump typescript from 5.3.2 to 5.3.3 in /web (#954) Bumps [typescript](https://github.com/Microsoft/TypeScript) from 5.3.2 to 5.3.3. - [Release notes](https://github.com/Microsoft/TypeScript/releases) - [Commits](https://github.com/Microsoft/TypeScript/compare/v5.3.2...v5.3.3) --- updated-dependencies: - dependency-name: typescript dependency-type: direct:development update-type: version-update:semver-patch ... Signed-off-by: dependabot[bot] Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> --- web/package-lock.json | 8 ++++---- web/package.json | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/web/package-lock.json b/web/package-lock.json index e1d9ba7..68df689 100644 --- a/web/package-lock.json +++ b/web/package-lock.json @@ -39,7 +39,7 @@ "svelte-check": "^3.6.2", "tailwindcss": "^3.3.6", "tslib": "^2.6.2", - "typescript": "^5.3.2", + "typescript": "^5.3.3", "vite": "^4.5.1" } }, @@ -5572,9 +5572,9 @@ } }, "node_modules/typescript": { - "version": "5.3.2", - "resolved": "https://registry.npmjs.org/typescript/-/typescript-5.3.2.tgz", - "integrity": "sha512-6l+RyNy7oAHDfxC4FzSJcz9vnjTKxrLpDG5M2Vu4SHRVNg6xzqZp6LYSR9zjqQTu8DU/f5xwxUdADOkbrIX2gQ==", + "version": "5.3.3", + "resolved": "https://registry.npmjs.org/typescript/-/typescript-5.3.3.tgz", + "integrity": "sha512-pXWcraxM0uxAS+tN0AG/BF2TyqmHO014Z070UsJ+pFvYuRSq8KH8DmWpnbXe0pEPDHXZV3FcAbJkijJ5oNEnWw==", "dev": true, "bin": { "tsc": "bin/tsc", diff --git a/web/package.json b/web/package.json index 513f6e4..096bd05 100644 --- a/web/package.json +++ b/web/package.json @@ -32,7 +32,7 @@ "svelte-check": "^3.6.2", "tailwindcss": "^3.3.6", "tslib": "^2.6.2", - "typescript": "^5.3.2", + "typescript": "^5.3.3", "vite": "^4.5.1" }, "type": "module", From 0ef3438180712dfc5ab332c932ecc0b56d14cbf2 Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Fri, 8 Dec 2023 07:51:08 -0500 Subject: [PATCH 4/6] Bump markdown-it from 13.0.2 to 14.0.0 in /web (#957) Bumps [markdown-it](https://github.com/markdown-it/markdown-it) from 13.0.2 to 14.0.0. - [Changelog](https://github.com/markdown-it/markdown-it/blob/master/CHANGELOG.md) - [Commits](https://github.com/markdown-it/markdown-it/compare/13.0.2...14.0.0) --- updated-dependencies: - dependency-name: markdown-it dependency-type: direct:production update-type: version-update:semver-major ... Signed-off-by: dependabot[bot] Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> --- web/package-lock.json | 53 +++++++++++++++++++++++++------------------ web/package.json | 2 +- 2 files changed, 32 insertions(+), 23 deletions(-) diff --git a/web/package-lock.json b/web/package-lock.json index 68df689..a0132ea 100644 --- a/web/package-lock.json +++ b/web/package-lock.json @@ -13,7 +13,7 @@ "clipboard": "^2.0.11", "daisyui": "^4.4.19", "highlight.js": "^11.9.0", - "markdown-it": "^13.0.2", + "markdown-it": "^14.0.0", "markdown-it-highlightjs": "^4.0.1", "prettier-plugin-svelte": "^3.1.2", "prettier-plugin-tailwindcss": "^0.5.9" @@ -1971,9 +1971,9 @@ "dev": true }, "node_modules/entities": { - "version": "3.0.1", - "resolved": "https://registry.npmjs.org/entities/-/entities-3.0.1.tgz", - "integrity": "sha512-WiyBqoomrwMdFG1e0kqvASYfnlb0lp8M5o5Fw2OFq1hNZxxcNk8Ik0Xm7LxzBhuidnZB/UtBqVCgUz3kBOP51Q==", + "version": "4.5.0", + "resolved": "https://registry.npmjs.org/entities/-/entities-4.5.0.tgz", + "integrity": "sha512-V0hjH4dGPh9Ao5p0MoRY6BVqtwCjhz6vI5LT8AJ55H+4g9/4vbHx1I54fS0XuclLhDHArPQCiMjDxjaL8fPxhw==", "engines": { "node": ">=0.12" }, @@ -3542,11 +3542,11 @@ "dev": true }, "node_modules/linkify-it": { - "version": "4.0.1", - "resolved": "https://registry.npmjs.org/linkify-it/-/linkify-it-4.0.1.tgz", - "integrity": "sha512-C7bfi1UZmoj8+PQx22XyeXCuBlokoyWQL5pWSP+EI6nzRylyThouddufc2c1NDIcP9k5agmN9fLpA7VNJfIiqw==", + "version": "5.0.0", + "resolved": "https://registry.npmjs.org/linkify-it/-/linkify-it-5.0.0.tgz", + "integrity": "sha512-5aHCbzQRADcdP+ATqnDuhhJ/MRIqDkZX5pyjFHRRysS8vZ5AbqGEoFIb6pYHPZ+L/OC2Lc+xT8uHVVR5CAK/wQ==", "dependencies": { - "uc.micro": "^1.0.1" + "uc.micro": "^2.0.0" } }, "node_modules/locate-character": { @@ -3606,18 +3606,19 @@ } }, "node_modules/markdown-it": { - "version": "13.0.2", - "resolved": "https://registry.npmjs.org/markdown-it/-/markdown-it-13.0.2.tgz", - "integrity": "sha512-FtwnEuuK+2yVU7goGn/MJ0WBZMM9ZPgU9spqlFs7/A/pDIUNSOQZhUgOqYCficIuR2QaFnrt8LHqBWsbTAoI5w==", + "version": "14.0.0", + "resolved": "https://registry.npmjs.org/markdown-it/-/markdown-it-14.0.0.tgz", + "integrity": "sha512-seFjF0FIcPt4P9U39Bq1JYblX0KZCjDLFFQPHpL5AzHpqPEKtosxmdq/LTVZnjfH7tjt9BxStm+wXcDBNuYmzw==", "dependencies": { "argparse": "^2.0.1", - "entities": "~3.0.1", - "linkify-it": "^4.0.1", - "mdurl": "^1.0.1", - "uc.micro": "^1.0.5" + "entities": "^4.4.0", + "linkify-it": "^5.0.0", + "mdurl": "^2.0.0", + "punycode.js": "^2.3.1", + "uc.micro": "^2.0.0" }, "bin": { - "markdown-it": "bin/markdown-it.js" + "markdown-it": "bin/markdown-it.mjs" } }, "node_modules/markdown-it-highlightjs": { @@ -3634,9 +3635,9 @@ "integrity": "sha512-GaqWWShW4kv/G9IEucWScBx9G1/vsFZZJUO+tD26M8J8z3Kw5RDQjaoZe03YAClgeS/SWPOcb4nkFBTEi5DUEA==" }, "node_modules/mdurl": { - "version": "1.0.1", - "resolved": "https://registry.npmjs.org/mdurl/-/mdurl-1.0.1.tgz", - "integrity": "sha512-/sKlQJCBYVY9Ers9hqzKou4H6V5UWc/M59TH2dvkt+84itfnq7uFOMLpOiOS4ujvHP4etln18fmIxA5R5fll0g==" + "version": "2.0.0", + "resolved": "https://registry.npmjs.org/mdurl/-/mdurl-2.0.0.tgz", + "integrity": "sha512-Lf+9+2r+Tdp5wXDXC4PcIBjTDtq4UKjCPMQhKIuzpJNW0b96kVqSwW0bT7FhRSfmAiFYgP+SCRvdrDozfh0U5w==" }, "node_modules/merge-stream": { "version": "2.0.0", @@ -4437,6 +4438,14 @@ "node": ">=6" } }, + "node_modules/punycode.js": { + "version": "2.3.1", + "resolved": "https://registry.npmjs.org/punycode.js/-/punycode.js-2.3.1.tgz", + "integrity": "sha512-uxFIHU0YlHYhDQtV4R9J6a52SLx28BCjT+4ieh7IGbgwVJWO+km431c4yRlREUAsAmt/uMjQUyQHNEPf0M39CA==", + "engines": { + "node": ">=6" + } + }, "node_modules/queue-microtask": { "version": "1.2.3", "resolved": "https://registry.npmjs.org/queue-microtask/-/queue-microtask-1.2.3.tgz", @@ -5585,9 +5594,9 @@ } }, "node_modules/uc.micro": { - "version": "1.0.6", - "resolved": "https://registry.npmjs.org/uc.micro/-/uc.micro-1.0.6.tgz", - "integrity": "sha512-8Y75pvTYkLJW2hWQHXxoqRgV7qb9B+9vFEtidML+7koHUFapnVJAZ6cKs+Qjz5Aw3aZWHMC6u0wJE3At+nSGwA==" + "version": "2.0.0", + "resolved": "https://registry.npmjs.org/uc.micro/-/uc.micro-2.0.0.tgz", + "integrity": "sha512-DffL94LsNOccVn4hyfRe5rdKa273swqeA5DJpMOeFmEn1wCDc7nAbbB0gXlgBCL7TNzeTv6G7XVWzan7iJtfig==" }, "node_modules/unbox-primitive": { "version": "1.0.2", diff --git a/web/package.json b/web/package.json index 096bd05..6877b7d 100644 --- a/web/package.json +++ b/web/package.json @@ -42,7 +42,7 @@ "clipboard": "^2.0.11", "daisyui": "^4.4.19", "highlight.js": "^11.9.0", - "markdown-it": "^13.0.2", + "markdown-it": "^14.0.0", "markdown-it-highlightjs": "^4.0.1", "prettier-plugin-svelte": "^3.1.2", "prettier-plugin-tailwindcss": "^0.5.9" From 51ef0b3b6173a7725b4a8fb1f0e67f22d06d2f89 Mon Sep 17 00:00:00 2001 From: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> Date: Fri, 8 Dec 2023 09:24:06 -0500 Subject: [PATCH 5/6] Add Zephyr 3B (#959) --- README.md | 2 +- api/src/serge/data/models.json | 11 +++++++++++ 2 files changed, 12 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 0e77870..51f0b84 100644 --- a/README.md +++ b/README.md @@ -72,7 +72,7 @@ Instructions for setting up Serge on Kubernetes can be found in the [wiki](https | **PsyMedRP** | 13B-v1, 20B-v1 | | **Starling LM** | 7B-Alpha | | **Vicuna** | 7B-v1.5, 13B-v1.5 | -| **Zephyr** | 7B-Alpha, 7B-Beta | +| **Zephyr** | 3B, 7B-Alpha, 7B-Beta | Additional models can be requested by opening a GitHub issue. diff --git a/api/src/serge/data/models.json b/api/src/serge/data/models.json index 3d6c4ba..c09718e 100644 --- a/api/src/serge/data/models.json +++ b/api/src/serge/data/models.json @@ -467,6 +467,17 @@ { "name": "Zephyr", "models": [ + { + "name": "Zephyr-3B", + "repo": "TheBloke/stablelm-zephyr-3b-GGUF", + "files": [ + { + "name": "q4_K_M", + "filename": "stablelm-zephyr-3b.Q4_K_M.gguf", + "disk_space": 1708595648.0 + } + ] + }, { "name": "Zephyr-7B-Alpha", "repo": "TheBloke/zephyr-7B-alpha-GGUF", From 9bcab1297c801bcfd9acc36baffb70b93d4c3a6e Mon Sep 17 00:00:00 2001 From: Olivier DEBAUCHE Date: Sat, 9 Dec 2023 00:19:50 +0100 Subject: [PATCH 6/6] Add Python-Code 13B and 33B (#960) * Add Python-Code 13B and 33B * Add Python-Code 13B and 33B * Update README.md --------- Co-authored-by: Juan Calderon-Perez <835733+gaby@users.noreply.github.com> --- README.md | 1 + api/src/serge/data/models.json | 63 ++++++++++++++++++++++++---------- 2 files changed, 46 insertions(+), 18 deletions(-) diff --git a/README.md b/README.md index 51f0b84..0b51b63 100644 --- a/README.md +++ b/README.md @@ -69,6 +69,7 @@ Instructions for setting up Serge on Kubernetes can be found in the [wiki](https | **OpenChat** | 7B-v3.5 | | **OpenLLaMA** | 3B-v2, 7B-v2, 13B-v2 | | **Orca 2** | 7B, 13B | +| **Python Code** | 13B, 33B | | **PsyMedRP** | 13B-v1, 20B-v1 | | **Starling LM** | 7B-Alpha | | **Vicuna** | 7B-v1.5, 13B-v1.5 | diff --git a/api/src/serge/data/models.json b/api/src/serge/data/models.json index c09718e..e8245f6 100644 --- a/api/src/serge/data/models.json +++ b/api/src/serge/data/models.json @@ -350,23 +350,7 @@ ] } ] - }, - { - "name": "SlimOrca", - "models": [ - { - "name": "SlimOrca-13B", - "repo": "TheBloke/SlimOrca-13B-GGUF", - "files": [ - { - "name": "q4_K_M", - "filename": "slimorca-13b.Q4_K_M.gguf", - "disk_space": 7865956352.0 - } - ] - } - ] - }, + }, { "name": "Orca_2", "models": [ @@ -393,7 +377,34 @@ ] } ] - }, + }, + { + "name": "Python-Code", + "models": [ + { + "name": "Python-Code-13B", + "repo": "TheBloke/Python-Code-13B-GGUF", + "files": [ + { + "name": "q4_K_M", + "filename": "python-code-13b.Q4_K_M.gguf", + "disk_space": 7865956352.0 + } + ] + }, + { + "name": "Python-Code-33B", + "repo": "TheBloke/Python-Code-33B-GGUF", + "files": [ + { + "name": "q4_K_M", + "filename": "python-code-33b.Q4_K_M.gguf", + "disk_space": 19621140000.0 + } + ] + } + ] + }, { "name": "PsyMedRP", "models": [ @@ -421,6 +432,22 @@ } ] }, + { + "name": "SlimOrca", + "models": [ + { + "name": "SlimOrca-13B", + "repo": "TheBloke/SlimOrca-13B-GGUF", + "files": [ + { + "name": "q4_K_M", + "filename": "slimorca-13b.Q4_K_M.gguf", + "disk_space": 7865956352.0 + } + ] + } + ] + }, { "name": "StarlingLM", "models": [