From 3d38b1b4e52e84d397b7b220019ee4fd84106939 Mon Sep 17 00:00:00 2001
From: Ian Macleod
Date: Fri, 6 Oct 2023 22:37:56 +0000
Subject: [PATCH] update 180b inference framework

---
 .../domain/use_cases/llm_model_endpoint_use_cases.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py b/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py
index 41f0a92c9..5f4eb8724 100644
--- a/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py
+++ b/model-engine/model_engine_server/domain/use_cases/llm_model_endpoint_use_cases.py
@@ -102,8 +102,6 @@
         "falcon-7b-instruct": "tiiuae/falcon-7b-instruct",
         "falcon-40b": "tiiuae/falcon-40b",
         "falcon-40b-instruct": "tiiuae/falcon-40b-instruct",
-        "falcon-180b": "tiiuae/falcon-180B",
-        "falcon-180b-chat": "tiiuae/falcon-180B-chat",
     },
     LLMInferenceFramework.VLLM: {
         "mpt-7b": "mosaicml/mpt-7b",
@@ -121,6 +119,8 @@
         "falcon-40b-instruct": "tiiuae/falcon-40b-instruct",
         "mistral-7b": "mistralai/Mistral-7B-v0.1",
         "mistral-7b-instruct": "mistralai/Mistral-7B-Instruct-v0.1",
+        "falcon-180b": "tiiuae/falcon-180B",
+        "falcon-180b-chat": "tiiuae/falcon-180B-chat",
     },
     LLMInferenceFramework.LIGHTLLM: {
         "llama-7b": "decapoda-research/llama-7b-hf",