From 43a4af2cfe47b28e099a86f16ac8e0e7782e3c7d Mon Sep 17 00:00:00 2001 From: Ian Macleod Date: Thu, 9 Nov 2023 17:43:25 +0000 Subject: [PATCH 1/2] adding codellama 34b logic --- docs/model_zoo.md | 3 ++- .../domain/use_cases/llm_model_endpoint_use_cases.py | 2 ++ 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/docs/model_zoo.md b/docs/model_zoo.md index 0431ea143..fe1ac6e98 100644 --- a/docs/model_zoo.md +++ b/docs/model_zoo.md @@ -24,7 +24,8 @@ Scale hosts the following models in the LLM Engine Model Zoo: | `codellama-7b-instruct` | ✅ | ✅ | text-generation-inference, vllm | | `codellama-13b` | ✅ | | text-generation-inference, vllm | | `codellama-13b-instruct` | ✅ | | text-generation-inference, vllm | -| `codellama-34b` | ✅ | | text-generation-inference, vllm | +| `codellama-34b` | ✅ | ✅ | text-generation-inference, vllm | +| `codellama-34b-instruct` | ✅ | ✅ | text-generation-inference, vllm | ## Usage diff --git a/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py b/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py index ed840ec28..433c6cd11 100644 --- a/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py +++ b/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py @@ -107,6 +107,7 @@ "codellama-13b": "codellama/CodeLlama-13b-hf", "codellama-13b-instruct": "codellama/CodeLlama-13b-Instruct-hf", "codellama-34b": "codellama/CodeLlama-34b-hf", + "codellama-34b-instruct": "codellama/CodeLlama-34b-Instruct-hf", "llm-jp-13b-instruct-full": "llm-jp/llm-jp-13b-instruct-full-jaster-v1.0", "llm-jp-13b-instruct-full-dolly": "llm-jp/llm-jp-13b-instruct-full-dolly-oasst-v1.0", }, @@ -133,6 +134,7 @@ "codellama-13b": "codellama/CodeLlama-13b-hf", "codellama-13b-instruct": "codellama/CodeLlama-13b-Instruct-hf", "codellama-34b": "codellama/CodeLlama-34b-hf", + "codellama-34b-instruct": "codellama/CodeLlama-34b-Instruct-hf", "mammoth-coder-llama-2-7b": "TIGER-Lab/MAmmoTH-Coder-7B", "mammoth-coder-llama-2-13b": "TIGER-Lab/MAmmoTH-Coder-13B", "mammoth-coder-llama-2-34b": "TIGER-Lab/MAmmoTH-Coder-34B", From abde58987006dbe983dc533ff1aff30de843eff8 Mon Sep 17 00:00:00 2001 From: Ian Macleod Date: Thu, 9 Nov 2023 18:04:29 +0000 Subject: [PATCH 2/2] adding 13b to docs --- docs/model_zoo.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/model_zoo.md b/docs/model_zoo.md index fe1ac6e98..ebe9f0825 100644 --- a/docs/model_zoo.md +++ b/docs/model_zoo.md @@ -22,8 +22,8 @@ Scale hosts the following models in the LLM Engine Model Zoo: | `mistral-7b-instruct` | ✅ | ✅ | vllm | | `codellama-7b` | ✅ | ✅ | text-generation-inference, vllm | | `codellama-7b-instruct` | ✅ | ✅ | text-generation-inference, vllm | -| `codellama-13b` | ✅ | | text-generation-inference, vllm | -| `codellama-13b-instruct` | ✅ | | text-generation-inference, vllm | +| `codellama-13b` | ✅ | ✅ | text-generation-inference, vllm | +| `codellama-13b-instruct` | ✅ | ✅ | text-generation-inference, vllm | | `codellama-34b` | ✅ | ✅ | text-generation-inference, vllm | | `codellama-34b-instruct` | ✅ | ✅ | text-generation-inference, vllm |