Feature/sagemaker embedding (#1161)

* Sagemaker deployed embedding model support

---------

Co-authored-by: Pablo Orgaz <pabloogc@gmail.com>
2025-12-22 17:05:41 +01:00 · 2023-11-05 16:16:49 +01:00 · 2023-11-05 16:16:49 +01:00 · ad512e3c42
commit ad512e3c42
parent f29df84301
9 changed files with 114 additions and 7 deletions
--- a/private_gpt/components/llm/custom/sagemaker.py
+++ b/private_gpt/components/llm/custom/sagemaker.py
@@ -4,7 +4,7 @@ from __future__ import annotations
 import io
 import json
 import logging
-from typing import TYPE_CHECKING
+from typing import TYPE_CHECKING, Any

 import boto3  # type: ignore
 from llama_index.bridge.pydantic import Field
@@ -30,7 +30,6 @@ from llama_index.llms.llama_utils import (

 if TYPE_CHECKING:
    from collections.abc import Sequence
-    from typing import Any

    from llama_index.callbacks import CallbackManager
    from llama_index.llms import (
--- a/private_gpt/components/llm/llm_component.py
+++ b/private_gpt/components/llm/llm_component.py
@@ -36,7 +36,7 @@ class LLMComponent:
                from private_gpt.components.llm.custom.sagemaker import SagemakerLLM

                self.llm = SagemakerLLM(
-                    endpoint_name=settings.sagemaker.endpoint_name,
+                    endpoint_name=settings.sagemaker.llm_endpoint_name,
                )
            case "openai":
                from llama_index.llms import OpenAI