feat: prompt_style applied to all LLMs + extra LLM params. (#1835)

* Moved prompt_style to the main LLM settings, since all LLMs from llama_index can use it. Also added temperature, context window size, max_tokens, and max_new_tokens to the openailike implementation so that its settings are consistent with the other implementations.
* Removed prompt_style from llamacpp entirely.
* Fixed settings-local.yaml to include prompt_style in the LLM settings instead of llamacpp.
2025-12-22 07:40:12 +01:00 · 2024-04-30 03:53:10 -04:00 · 2024-04-30 03:53:10 -04:00 · e21bf20c10
commit e21bf20c10
parent c1802e7cf0
4 changed files with 22 additions and 18 deletions
--- a/settings-local.yaml
+++ b/settings-local.yaml
@@ -8,9 +8,9 @@ llm:
  max_new_tokens: 512
  context_window: 3900
  tokenizer: mistralai/Mistral-7B-Instruct-v0.2
+  prompt_style: "mistral"

 llamacpp:
-  prompt_style: "mistral"
  llm_hf_repo_id: TheBloke/Mistral-7B-Instruct-v0.2-GGUF
  llm_hf_model_file: mistral-7b-instruct-v0.2.Q4_K_M.gguf

@@ -24,4 +24,4 @@ vectorstore:
  database: qdrant

 qdrant:
-  path: local_data/private_gpt/qdrant
+  path: local_data/private_gpt/qdrant