From dae76ac4189d46696b65385444bc49824b1daab4 Mon Sep 17 00:00:00 2001
From: Matthew Farrellee <matt@cs.wisc.edu>
Date: Thu, 26 Sep 2024 10:50:11 -0400
Subject: [PATCH] add meta/llama-3.2-1b-instruct & meta/llama-3.2-3b-instruct
 chat models and meta/llama-3.2-11b-vision-instruct &
 meta/llama-3.2-90b-vision-instruct vision models

---
 .../langchain_nvidia_ai_endpoints/_statics.py | 25 +++++++++++++++++++
 1 file changed, 25 insertions(+)

diff --git a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py
index 85078191..c88c1934 100644
--- a/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py
+++ b/libs/ai-endpoints/langchain_nvidia_ai_endpoints/_statics.py
@@ -423,6 +423,19 @@ def validate_client(self) -> "Model":
         model_type="chat",
         client="ChatNVIDIA",
     ),
+    "meta/llama-3.2-1b-instruct": Model(
+        id="meta/llama-3.2-1b-instruct",
+        model_type="chat",
+        client="ChatNVIDIA",
+        supports_structured_output=True,
+    ),
+    "meta/llama-3.2-3b-instruct": Model(
+        id="meta/llama-3.2-3b-instruct",
+        model_type="chat",
+        client="ChatNVIDIA",
+        supports_tools=True,
+        supports_structured_output=True,
+    ),
 }
 
 QA_MODEL_TABLE = {
@@ -494,6 +507,18 @@ def validate_client(self) -> "Model":
         client="ChatNVIDIA",
         endpoint="https://ai.api.nvidia.com/v1/vlm/nvidia/vila",
     ),
+    "meta/llama-3.2-11b-vision-instruct": Model(
+        id="meta/llama-3.2-11b-vision-instruct",
+        model_type="vlm",
+        client="ChatNVIDIA",
+        endpoint="https://ai.api.nvidia.com/v1/gr/meta/llama-3.2-11b-vision-instruct/chat/completions",
+    ),
+    "meta/llama-3.2-90b-vision-instruct": Model(
+        id="meta/llama-3.2-90b-vision-instruct",
+        model_type="vlm",
+        client="ChatNVIDIA",
+        endpoint="https://ai.api.nvidia.com/v1/gr/meta/llama-3.2-90b-vision-instruct/chat/completions",
+    ),
 }
 
 EMBEDDING_MODEL_TABLE = {