diff --git a/services/rag-api/services/chat.py b/services/rag-api/services/chat.py index 801bae8..5a44898 100644 --- a/services/rag-api/services/chat.py +++ b/services/rag-api/services/chat.py @@ -54,6 +54,7 @@ Answer based on the above context:""" payload = { 'model': model, 'stream': True, + 'think': False, # Disable thinking mode for faster responses 'messages': [ {'role': 'system', 'content': SYSTEM_PROMPT}, {'role': 'user', 'content': prompt},