Feature/sagemaker embedding (#1161)

* Sagemaker deployed embedding model support

---------

Co-authored-by: Pablo Orgaz <pabloogc@gmail.com>
This commit is contained in:
Iván Martínez 2023-11-05 16:16:49 +01:00 committed by GitHub
parent f29df84301
commit ad512e3c42
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
9 changed files with 114 additions and 7 deletions

View file

@@ -4,7 +4,7 @@ from __future__ import annotations
import io
import json
import logging
-from typing import TYPE_CHECKING
+from typing import TYPE_CHECKING, Any
import boto3 # type: ignore
from llama_index.bridge.pydantic import Field
@@ -30,7 +30,6 @@ from llama_index.llms.llama_utils import (
if TYPE_CHECKING:
from collections.abc import Sequence
-from typing import Any
from llama_index.callbacks import CallbackManager
from llama_index.llms import (

View file

@@ -36,7 +36,7 @@ class LLMComponent:
from private_gpt.components.llm.custom.sagemaker import SagemakerLLM
self.llm = SagemakerLLM(
-endpoint_name=settings.sagemaker.endpoint_name,
+endpoint_name=settings.sagemaker.llm_endpoint_name,
)
case "openai":
from llama_index.llms import OpenAI