mirror of
https://github.com/khoj-ai/khoj.git
synced 2024-11-27 17:35:07 +01:00
Unwrap any json in md code block, when parsing chat actor responses
This is a more robust way to extract json output requested from gemma-2 (2B, 9B) models which tend to return json in md codeblocks. Other models should remain unaffected by this change. Also removed request to not wrap json in codeblocks from prompts. As code is doing the unwrapping automatically now, when present
This commit is contained in:
parent
ca45fce8ac
commit
acdc3f9470
4 changed files with 11 additions and 2 deletions
|
@ -66,7 +66,7 @@ dependencies = [
|
||||||
"pymupdf >= 1.23.5",
|
"pymupdf >= 1.23.5",
|
||||||
"django == 5.0.7",
|
"django == 5.0.7",
|
||||||
"authlib == 1.2.1",
|
"authlib == 1.2.1",
|
||||||
"llama-cpp-python == 0.2.82",
|
"llama-cpp-python == 0.2.88",
|
||||||
"itsdangerous == 2.1.2",
|
"itsdangerous == 2.1.2",
|
||||||
"httpx == 0.25.0",
|
"httpx == 0.25.0",
|
||||||
"pgvector == 0.2.4",
|
"pgvector == 0.2.4",
|
||||||
|
|
|
@ -103,6 +103,9 @@ def extract_questions_offline(
|
||||||
.replace("']", '"]')
|
.replace("']", '"]')
|
||||||
.replace("', '", '", "')
|
.replace("', '", '", "')
|
||||||
)
|
)
|
||||||
|
# Remove any markdown json codeblock formatting if present (useful for gemma-2)
|
||||||
|
if response.startswith("```json"):
|
||||||
|
response = response[7:-3]
|
||||||
questions: List[str] = json.loads(questions_str)
|
questions: List[str] = json.loads(questions_str)
|
||||||
questions = filter_questions(questions)
|
questions = filter_questions(questions)
|
||||||
except:
|
except:
|
||||||
|
|
|
@ -587,7 +587,7 @@ You are Khoj, an advanced google search assistant. You are tasked with construct
|
||||||
- Official, up-to-date information about you, Khoj, is available at site:khoj.dev, github or pypi.
|
- Official, up-to-date information about you, Khoj, is available at site:khoj.dev, github or pypi.
|
||||||
|
|
||||||
What Google searches, if any, will you need to perform to answer the user's question?
|
What Google searches, if any, will you need to perform to answer the user's question?
|
||||||
Provide search queries as a list of strings in a JSON object. Do not wrap the json in a codeblock.
|
Provide search queries as a list of strings in a JSON object.
|
||||||
Current Date: {current_date}
|
Current Date: {current_date}
|
||||||
User's Location: {location}
|
User's Location: {location}
|
||||||
{username}
|
{username}
|
||||||
|
|
|
@ -279,6 +279,9 @@ async def aget_relevant_information_sources(query: str, conversation_history: di
|
||||||
|
|
||||||
try:
|
try:
|
||||||
response = response.strip()
|
response = response.strip()
|
||||||
|
# Remove any markdown json codeblock formatting if present (useful for gemma-2)
|
||||||
|
if response.startswith("```json"):
|
||||||
|
response = response[7:-3]
|
||||||
response = json.loads(response)
|
response = json.loads(response)
|
||||||
response = [q.strip() for q in response["source"] if q.strip()]
|
response = [q.strip() for q in response["source"] if q.strip()]
|
||||||
if not isinstance(response, list) or not response or len(response) == 0:
|
if not isinstance(response, list) or not response or len(response) == 0:
|
||||||
|
@ -401,6 +404,9 @@ async def generate_online_subqueries(
|
||||||
# Validate that the response is a non-empty, JSON-serializable list
|
# Validate that the response is a non-empty, JSON-serializable list
|
||||||
try:
|
try:
|
||||||
response = response.strip()
|
response = response.strip()
|
||||||
|
# Remove any markdown json codeblock formatting if present (useful for gemma-2)
|
||||||
|
if response.startswith("```json") and response.endswith("```"):
|
||||||
|
response = response[7:-3]
|
||||||
response = json.loads(response)
|
response = json.loads(response)
|
||||||
response = [q.strip() for q in response["queries"] if q.strip()]
|
response = [q.strip() for q in response["queries"] if q.strip()]
|
||||||
if not isinstance(response, list) or not response or len(response) == 0:
|
if not isinstance(response, list) or not response or len(response) == 0:
|
||||||
|
|
Loading…
Reference in a new issue