Unverified commit 1a0e705d, authored by Matthew Farrellee, committed by GitHub

add dynamic model listing support (#13398)

parent 0928dc25
@@ -10,7 +10,6 @@ from llama_index.core.base.llms.generic_utils import (
     get_from_param_or_env,
 )
-from llama_index.llms.nvidia.utils import API_CATALOG_MODELS
 from llama_index.llms.openai_like import OpenAILike
@@ -54,10 +53,19 @@ class NVIDIA(OpenAILike):
     @property
     def available_models(self) -> List[Model]:
-        ids = API_CATALOG_MODELS.keys()
+        exclude = {
+            "mistralai/mixtral-8x22b-v0.1",  # not a /chat/completion endpoint
+        }
+        # do not exclude models in nim mode. the nim administrator has control
+        # over the model name and may deploy an excluded name on the nim's
+        # /chat/completion endpoint.
         if self._mode == "nim":
-            ids = [model.id for model in self._get_client().models.list()]
-        return [Model(id=name) for name in ids]
+            exclude = set()
+        return [
+            model
+            for model in self._get_client().models.list().data
+            if model.id not in exclude
+        ]

     @classmethod
     def class_name(cls) -> str:
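For context, a minimal sketch of the behavior this hunk introduces. It is not part of the commit; the NVIDIA_API_KEY environment variable and the commented-out mode() call are assumptions inferred from the integration tests further down.

# Sketch only: illustrates the new available_models behavior.
# Assumes NVIDIA_API_KEY is set in the environment.
from llama_index.llms.nvidia import NVIDIA

llm = NVIDIA()

# available_models is now built from a live call to the /models endpoint
# (via self._get_client().models.list()) instead of the static
# API_CATALOG_MODELS table, with the non-chat model filtered out.
for model in llm.available_models:
    print(model.id)

# In "nim" mode the exclude set is emptied, so whatever model names the
# NIM administrator deployed are listed verbatim. The exact mode()
# signature is an assumption based on the tests below:
# nim_llm = NVIDIA().mode("nim", base_url="http://localhost:8000/v1")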
@@ -30,7 +30,7 @@ license = "MIT"
 name = "llama-index-llms-nvidia"
 packages = [{include = "llama_index/"}]
 readme = "README.md"
-version = "0.1.1"
+version = "0.1.2"

 [tool.poetry.dependencies]
 python = ">=3.8.1,<4.0"
@@ -73,3 +73,16 @@ async def test_astream_complete(chat_model: str, mode: dict) -> None:
     responses = [response async for response in gen]
     assert all(isinstance(response, CompletionResponse) for response in responses)
     assert all(isinstance(response.delta, str) for response in responses)
+
+
+@pytest.mark.integration()
+@pytest.mark.parametrize(
+    "excluded",
+    [
+        "mistralai/mixtral-8x22b-v0.1",  # not a /chat/completion endpoint
+    ],
+)
+def test_exclude_models(mode: dict, excluded: str) -> None:
+    assert excluded not in [
+        model.id for model in NVIDIA().mode(**mode).available_models
+    ]
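The new test is gated behind the integration marker, so it should be selectable with pytest's standard marker filtering, e.g. pytest -m integration -k test_exclude_models, with the suite's mode fixture configured; the exact invocation is an assumption, not part of the commit.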