feat: change ollama default model to llama3.1

2025-12-22 13:55:41 +01:00 · 2024-07-29 17:14:46 +02:00 · 2024-07-29 17:14:46 +02:00 · e2b319db92
commit e2b319db92
parent d080969407
6 changed files with 7 additions and 7 deletions
--- a/fern/docs/pages/installation/installation.mdx
+++ b/fern/docs/pages/installation/installation.mdx
@ -135,14 +135,14 @@ Now, start Ollama service (it will start a local inference server, serving both
 ollama serve
 ```

-Install the models to be used, the default settings-ollama.yaml is configured to user mistral 7b LLM (~4GB) and nomic-embed-text Embeddings (~275MB)
+Install the models to be used, the default settings-ollama.yaml is configured to use llama3.1 8b LLM (~4GB) and nomic-embed-text Embeddings (~275MB)

 By default, PGPT will automatically pull models as needed. This behavior can be changed by modifying the `ollama.autopull_models` property.

 In any case, if you want to manually pull models, run the following commands:

 ```bash
-ollama pull mistral
+ollama pull llama3.1
 ollama pull nomic-embed-text
 ```

--- a/fern/docs/pages/installation/troubleshooting.mdx
+++ b/fern/docs/pages/installation/troubleshooting.mdx
@ -24,7 +24,7 @@ PrivateGPT uses the `AutoTokenizer` library to tokenize input text accurately. I
   In your `settings.yaml` file, specify the model you want to use:
   ```yaml
   llm:
-     tokenizer: mistralai/Mistral-7B-Instruct-v0.2
+     tokenizer: meta-llama/Meta-Llama-3.1-8B-Instruct
   ```
 2. **Set Access Token for Gated Models:**
   If you are using a gated model, ensure the `access_token` is set as mentioned in the previous section.
--- a/settings-docker.yaml
+++ b/settings-docker.yaml
@ -20,7 +20,7 @@ sagemaker:
  embedding_endpoint_name: ${PGPT_SAGEMAKER_EMBEDDING_ENDPOINT_NAME:}

 ollama:
-  llm_model: ${PGPT_OLLAMA_LLM_MODEL:mistral}
+  llm_model: ${PGPT_OLLAMA_LLM_MODEL:llama3.1}
  embedding_model: ${PGPT_OLLAMA_EMBEDDING_MODEL:nomic-embed-text}
  api_base: ${PGPT_OLLAMA_API_BASE:http://ollama:11434}
  embedding_api_base: ${PGPT_OLLAMA_EMBEDDING_API_BASE:http://ollama:11434}
--- a/settings-ollama-pg.yaml
+++ b/settings-ollama-pg.yaml
@ -14,7 +14,7 @@ embedding:
  embed_dim: 768

 ollama:
-  llm_model: mistral
+  llm_model: llama3.1
  embedding_model: nomic-embed-text
  api_base: http://localhost:11434

--- a/settings-ollama.yaml
+++ b/settings-ollama.yaml
@ -11,7 +11,7 @@ embedding:
  mode: ollama

 ollama:
-  llm_model: mistral
+  llm_model: llama3.1
  embedding_model: nomic-embed-text
  api_base: http://localhost:11434
  embedding_api_base: http://localhost:11434  # change if your embedding model runs on another ollama
--- a/settings.yaml
+++ b/settings.yaml
@ -111,7 +111,7 @@ openai:
  embedding_api_key: ${OPENAI_API_KEY:}

 ollama:
-  llm_model: llama2
+  llm_model: llama3.1
  embedding_model: nomic-embed-text
  api_base: http://localhost:11434
  embedding_api_base: http://localhost:11434  # change if your embedding model runs on another ollama