2021-08-22 03:47:55 +02:00
|
|
|
content-type:
|
|
|
|
org:
|
2022-08-04 21:57:35 +02:00
|
|
|
input-files: # ["/path/to/org-file.org"] REQUIRED IF input-filter IS NOT SET OR
|
2023-01-09 02:40:18 +01:00
|
|
|
input-filter: # ["/path/to/org/*.org"] REQUIRED IF input-files IS NOT SET
|
2022-08-04 21:57:35 +02:00
|
|
|
compressed-jsonl: "~/.khoj/content/org/org.jsonl.gz"
|
|
|
|
embeddings-file: "~/.khoj/content/org/org_embeddings.pt"
|
2022-09-11 16:30:02 +02:00
|
|
|
index_heading_entries: false # Set to true to index entries with empty body
|
2021-08-22 03:47:55 +02:00
|
|
|
|
2022-07-21 19:54:30 +02:00
|
|
|
markdown:
|
2022-08-04 21:57:35 +02:00
|
|
|
input-files: # ["/path/to/markdown-file.md"] REQUIRED IF input-filter IS NOT SET OR
|
2023-01-09 01:08:00 +01:00
|
|
|
input-filter: # ["/path/to/markdown/*.md"] REQUIRED IF input-files IS NOT SET
|
2022-08-04 21:57:35 +02:00
|
|
|
compressed-jsonl: "~/.khoj/content/markdown/markdown.jsonl.gz"
|
|
|
|
embeddings-file: "~/.khoj/content/markdown/markdown_embeddings.pt"
|
2022-07-21 19:54:30 +02:00
|
|
|
|
2021-08-23 06:54:49 +02:00
|
|
|
ledger:
|
2022-08-04 21:57:35 +02:00
|
|
|
input-files: # ["/path/to/ledger-file.beancount"] REQUIRED IF input-filter IS NOT SET OR
|
2023-01-09 02:40:18 +01:00
|
|
|
input-filter: # ["/path/to/ledger/*.beancount"] REQUIRED IF input-files IS NOT SET
|
2022-08-04 21:57:35 +02:00
|
|
|
compressed-jsonl: "~/.khoj/content/ledger/ledger.jsonl.gz"
|
|
|
|
embeddings-file: "~/.khoj/content/ledger/ledger_embeddings.pt"
|
2021-08-23 06:54:49 +02:00
|
|
|
|
2022-08-04 21:57:35 +02:00
|
|
|
image:
|
2023-01-09 02:40:18 +01:00
|
|
|
input-directories: # ["/path/to/images/"] REQUIRED IF input-filter IS NOT SET OR
|
|
|
|
input-filter: # ["/path/to/images/*.jpg"] REQUIRED IF input-directories IS NOT SET
|
2022-08-04 21:57:35 +02:00
|
|
|
embeddings-file: "~/.khoj/content/image/image_embeddings.pt"
|
|
|
|
batch-size: 50
|
2022-08-18 22:10:33 +02:00
|
|
|
use-xmp-metadata: false
|
2021-10-03 01:11:27 +02:00
|
|
|
|
|
|
|
music:
|
2023-01-09 02:40:18 +01:00
|
|
|
input-files: # ["/path/to/music-file.org"] REQUIRED IF input-filter IS NOT SET OR
|
|
|
|
input-filter: # ["/path/to/music/*.org"] REQUIRED IF input-files IS NOT SET
|
2022-08-04 21:57:35 +02:00
|
|
|
compressed-jsonl: "~/.khoj/content/music/music.jsonl.gz"
|
|
|
|
embeddings-file: "~/.khoj/content/music/music_embeddings.pt"
|
2021-08-23 06:54:49 +02:00
|
|
|
|
2021-08-22 03:47:55 +02:00
|
|
|
search-type:
|
2022-01-14 22:46:56 +01:00
|
|
|
symmetric:
|
2022-07-18 18:16:40 +02:00
|
|
|
encoder: "sentence-transformers/all-MiniLM-L6-v2"
|
2022-01-14 22:46:56 +01:00
|
|
|
cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
|
2023-01-09 02:07:13 +01:00
|
|
|
encoder-type: sentence_transformers.SentenceTransformer
|
2022-08-04 21:57:35 +02:00
|
|
|
model_directory: "~/.khoj/search/symmetric/"
|
2022-01-14 22:46:56 +01:00
|
|
|
|
2021-08-22 03:47:55 +02:00
|
|
|
asymmetric:
|
2022-07-18 18:00:19 +02:00
|
|
|
encoder: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
|
2021-08-22 03:47:55 +02:00
|
|
|
cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
|
2023-01-09 02:07:13 +01:00
|
|
|
encoder-type: sentence_transformers.SentenceTransformer
|
2022-08-04 21:57:35 +02:00
|
|
|
model_directory: "~/.khoj/search/asymmetric/"
|
2021-08-23 06:54:49 +02:00
|
|
|
|
|
|
|
image:
|
2022-08-04 21:57:35 +02:00
|
|
|
encoder: "sentence-transformers/clip-ViT-B-32"
|
2023-01-09 02:07:13 +01:00
|
|
|
encoder-type: sentence_transformers.SentenceTransformer
|
2022-08-04 21:57:35 +02:00
|
|
|
model_directory: "~/.khoj/search/image/"
|
2021-11-26 20:56:26 +01:00
|
|
|
|
|
|
|
processor:
|
|
|
|
conversation:
|
2022-08-04 21:57:35 +02:00
|
|
|
openai-api-key: # "YOUR_OPENAI_API_KEY"
|
2023-01-09 04:08:03 +01:00
|
|
|
model: "text-davinci-003"
|
2022-08-04 21:57:35 +02:00
|
|
|
conversation-logfile: "~/.khoj/processor/conversation/conversation_logs.json"
|