Feature/sagemaker embedding (#1161)

* Sagemaker deployed embedding model support

---------

Co-authored-by: Pablo Orgaz <pabloogc@gmail.com>
This commit is contained in:
Iván Martínez 2023-11-05 16:16:49 +01:00 committed by GitHub
parent f29df84301
commit ad512e3c42
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
9 changed files with 114 additions and 7 deletions

14
settings-sagemaker.yaml Normal file
View file

@@ -0,0 +1,14 @@
# Settings profile that selects SageMaker as the LLM mode and names the
# SageMaker endpoints to use.
#
# NOTE(review): `${NAME:default}` values look like environment-variable
# placeholders with a fallback, resolved by the settings loader — confirm.
# They are deliberately left as unquoted plain scalars; verify the loader
# still expands them before quoting.
server:
  env_name: ${APP_ENV:prod}
  port: ${PORT:8001}

ui:
  enabled: true
  path: /

llm:
  mode: sagemaker

# NOTE(review): these appear to be deployment-specific, timestamped endpoint
# names — presumably to be replaced with the endpoints of your own account.
sagemaker:
  llm_endpoint_name: huggingface-pytorch-tgi-inference-2023-09-25-19-53-32-140
  embedding_endpoint_name: huggingface-pytorch-inference-2023-11-03-07-41-36-479