From ac5d18a7cbb9f50796c2986dd2862f282aff3355 Mon Sep 17 00:00:00 2001 From: Matthew Farrellee Date: Tue, 27 Aug 2024 17:00:43 -0400 Subject: [PATCH] set default model to nvidia/mistral-nemo-minitron-8b-base --- libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py | 5 +++++ libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py | 2 +- 2 files changed, 6 insertions(+), 1 deletion(-) diff --git a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py index a299252..21affcd 100644 --- a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py +++ b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py @@ -505,6 +505,11 @@ def validate_client(cls, client: str, values: dict) -> str: model_type="completions", client="NVIDIA", ), + "nvidia/mistral-nemo-minitron-8b-base": Model( + id="nvidia/mistral-nemo-minitron-8b-base", + model_type="completions", + client="NVIDIA", + ), } diff --git a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py index de58338..0dac095 100644 --- a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py +++ b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py @@ -22,7 +22,7 @@ class Config: validate_assignment = True _client: _NVIDIAClient = PrivateAttr(_NVIDIAClient) - _default_model_name: str = "bigcode/starcoder2-7b" + _default_model_name: str = "nvidia/mistral-nemo-minitron-8b-base" _default_base_url: str = "https://integrate.api.nvidia.com/v1" base_url: str = Field( description="Base url for model listing and invocation",