File tree 3 files changed +19
-1
lines changed
src/khoj/processor/conversation
3 files changed +19
-1
lines changed Original file line number Diff line number Diff line change 8
8
from khoj .database .models import Agent , ChatModel , KhojUser
9
9
from khoj .processor .conversation import prompts
10
10
from khoj .processor .conversation .openai .utils import (
11
+ ai_api_supports_json_enforcement ,
11
12
chat_completion_with_backoff ,
12
13
completion_with_backoff ,
13
14
)
14
15
from khoj .processor .conversation .utils import (
16
+ JsonSupport ,
15
17
clean_json ,
16
18
construct_structured_message ,
17
19
generate_chatml_messages_with_context ,
@@ -126,13 +128,14 @@ def send_message_to_model(
126
128
"""
127
129
128
130
# Get Response from GPT
131
+ json_support = ai_api_supports_json_enforcement (model , api_base_url )
129
132
return completion_with_backoff (
130
133
messages = messages ,
131
134
model_name = model ,
132
135
openai_api_key = api_key ,
133
136
temperature = temperature ,
134
137
api_base_url = api_base_url ,
135
- model_kwargs = {"response_format" : {"type" : response_type }},
138
+ model_kwargs = {"response_format" : {"type" : response_type }} if json_support >= JsonSupport . OBJECT else {} ,
136
139
tracer = tracer ,
137
140
)
138
141
Original file line number Diff line number Diff line change 16
16
)
17
17
18
18
from khoj .processor .conversation .utils import (
19
+ JsonSupport ,
19
20
ThreadedGenerator ,
20
21
commit_conversation_trace ,
21
22
)
@@ -245,3 +246,11 @@ def llm_thread(
245
246
logger .error (f"Error in llm_thread: { e } " , exc_info = True )
246
247
finally :
247
248
g .close ()
249
+
250
+
251
def ai_api_supports_json_enforcement(model_name: str, api_base_url: str = None) -> JsonSupport:
    """Determine the level of JSON response enforcement supported by the AI model API.

    Args:
        model_name: Name of the chat model (e.g. "gpt-4o", "deepseek-reasoner").
        api_base_url: Base URL of the OpenAI-compatible API endpoint. May be None
            when using the default OpenAI endpoint.

    Returns:
        JsonSupport.NONE    - API rejects any response_format constraint.
        JsonSupport.OBJECT  - API supports {"type": "json_object"} only.
        JsonSupport.SCHEMA  - API supports full JSON schema enforcement.
    """
    # Deepseek's reasoner models do not accept a response_format constraint at all.
    if model_name.startswith("deepseek-reasoner"):
        return JsonSupport.NONE
    # Guard against api_base_url=None (the default) before the substring test;
    # `in None` would raise TypeError. Azure AI endpoints only support json_object mode.
    if api_base_url and ".ai.azure.com" in api_base_url:
        return JsonSupport.OBJECT
    return JsonSupport.SCHEMA
Original file line number Diff line number Diff line change @@ -878,3 +878,9 @@ def safe_serialize(content: Any) -> str:
878
878
return str (content )
879
879
880
880
return "\n " .join ([f"{ json .dumps (safe_serialize (message .content ))[:max_length ]} ..." for message in messages ])
881
+
882
+
883
class JsonSupport(int, Enum):
    """Ordered levels of JSON response enforcement an AI model API can support.

    Subclasses int so levels are directly comparable, e.g.
    `json_support >= JsonSupport.OBJECT`.
    """

    NONE = 0  # No response_format constraint supported
    OBJECT = 1  # Supports {"type": "json_object"} only
    SCHEMA = 2  # Supports full JSON schema enforcement
You can’t perform that action at this time.
0 commit comments