Expanded example.env with a new LLM model, increased MAX_ARTICLE_LENGTH, updated the context size, and extended the .gitignore entries

2025-08-06 18:13:50 +02:00
parent e23a8d53d9
commit 092c065809
4 changed files with 6 additions and 2 deletions
--- a/backend/app/config.py
+++ b/backend/app/config.py
@@ -12,7 +12,7 @@ LLM_MODEL = os.getenv("LLM_MODEL", "mistral-nemo:12b")
 LLM_TIMEOUT_SECONDS = int(os.getenv("LLM_TIMEOUT_SECONDS", 180))
 OLLAMA_API_TIMEOUT_SECONDS = int(os.getenv("OLLAMA_API_TIMEOUT_SECONDS", 10))
 ARTICLE_FETCH_TIMEOUT = int(os.getenv("ARTICLE_FETCH_TIMEOUT", 30))
-MAX_ARTICLE_LENGTH = int(os.getenv("MAX_ARTICLE_LENGTH", 5000))
+MAX_ARTICLE_LENGTH = int(os.getenv("MAX_ARTICLE_LENGTH", 10_000))

 frontend_path = os.path.join(
    os.path.dirname(os.path.dirname(os.path.dirname(__file__))),
--- a/backend/app/services.py
+++ b/backend/app/services.py
@@ -209,7 +209,7 @@ class NewsFetcher:
            "format": "json",
            "options": {
                "num_gpu": 1,  # Force GPU usage
-                "num_ctx": 8192,  # Context size
+                "num_ctx": 128_000,  # Context size
            }
        }