mirror of
https://github.com/khoj-ai/khoj.git
synced 2024-11-23 15:38:55 +01:00
Use Jina API Key of Jina web scraper if configured in DB
Previously Jina search didn't API key. Now that it does need API key, we should re-use the API key set in the Jina web scraper config, otherwise fallback to using JINA_API_KEY from environment variable, if either is present. Resolves #978
This commit is contained in:
parent
69ef6829c1
commit
d6eece63f4
1 changed files with 22 additions and 4 deletions
|
@ -11,7 +11,7 @@ from bs4 import BeautifulSoup
|
||||||
from markdownify import markdownify
|
from markdownify import markdownify
|
||||||
|
|
||||||
from khoj.database.adapters import ConversationAdapters
|
from khoj.database.adapters import ConversationAdapters
|
||||||
from khoj.database.models import Agent, KhojUser, WebScraper
|
from khoj.database.models import Agent, KhojUser, ServerChatSettings, WebScraper
|
||||||
from khoj.processor.conversation import prompts
|
from khoj.processor.conversation import prompts
|
||||||
from khoj.routers.helpers import (
|
from khoj.routers.helpers import (
|
||||||
ChatEvent,
|
ChatEvent,
|
||||||
|
@ -362,13 +362,31 @@ async def search_with_jina(query: str, location: LocationData) -> Tuple[str, Dic
|
||||||
encoded_query = urllib.parse.quote(query)
|
encoded_query = urllib.parse.quote(query)
|
||||||
jina_search_api_url = f"{JINA_SEARCH_API_URL}/{encoded_query}"
|
jina_search_api_url = f"{JINA_SEARCH_API_URL}/{encoded_query}"
|
||||||
headers = {"Accept": "application/json"}
|
headers = {"Accept": "application/json"}
|
||||||
if JINA_API_KEY:
|
|
||||||
headers["Authorization"] = f"Bearer {JINA_API_KEY}"
|
# First check for jina scraper configuration in database
|
||||||
|
default_jina_scraper = (
|
||||||
|
await ServerChatSettings.objects.filter()
|
||||||
|
.prefetch_related("web_scraper")
|
||||||
|
.filter(web_scraper__type=WebScraper.WebScraperType.JINA)
|
||||||
|
.afirst()
|
||||||
|
)
|
||||||
|
if default_jina_scraper and default_jina_scraper.web_scraper:
|
||||||
|
jina_scraper = default_jina_scraper.web_scraper
|
||||||
|
else:
|
||||||
|
# Fallback to first configured Jina scraper in DB if no server settings
|
||||||
|
jina_scraper = await WebScraper.objects.filter(type=WebScraper.WebScraperType.JINA).afirst()
|
||||||
|
|
||||||
|
# Get API key from DB scraper config or environment variable
|
||||||
|
api_key = jina_scraper.api_key if jina_scraper and jina_scraper.api_key else JINA_API_KEY
|
||||||
|
|
||||||
|
if api_key:
|
||||||
|
headers["Authorization"] = f"Bearer {api_key}"
|
||||||
|
|
||||||
async with aiohttp.ClientSession() as session:
|
async with aiohttp.ClientSession() as session:
|
||||||
async with session.get(jina_search_api_url, headers=headers) as response:
|
async with session.get(jina_search_api_url, headers=headers) as response:
|
||||||
if response.status != 200:
|
if response.status != 200:
|
||||||
logger.error(await response.text())
|
error_text = await response.text()
|
||||||
|
logger.error(f"Jina search failed: {error_text}")
|
||||||
return query, {}
|
return query, {}
|
||||||
response_json = await response.json()
|
response_json = await response.json()
|
||||||
parsed_response = [
|
parsed_response = [
|
||||||
|
|
Loading…
Reference in a new issue