diff --git a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py index a299252..21affcd 100644 --- a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py +++ b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py @@ -505,6 +505,11 @@ def validate_client(cls, client: str, values: dict) -> str: model_type="completions", client="NVIDIA", ), + "nvidia/mistral-nemo-minitron-8b-base": Model( + id="nvidia/mistral-nemo-minitron-8b-base", + model_type="completions", + client="NVIDIA", + ), } diff --git a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py index de58338..0dac095 100644 --- a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py +++ b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/llm.py @@ -22,7 +22,7 @@ class Config: validate_assignment = True _client: _NVIDIAClient = PrivateAttr(_NVIDIAClient) - _default_model_name: str = "bigcode/starcoder2-7b" + _default_model_name: str = "nvidia/mistral-nemo-minitron-8b-base" _default_base_url: str = "https://integrate.api.nvidia.com/v1" base_url: str = Field( description="Base url for model listing and invocation",