khoj/sample_config.yml
Debanjum Singh Solanky 3e889760c7 Merge sample_config, docker_sample_config yml into a single sample_config.yml
- Update readme to indicate how to update the new sample_config to run on test data
2022-01-29 01:32:12 -05:00

47 lines
No EOL
1.5 KiB
YAML

content-type:
  # One stanza per content type (org, ledger, image, music).
  # Every path below starts with /data/ because that is the directory to
  # which the local files are copied in the docker-compose setup.
  # If you change this prefix, update the docker-compose volumes to match.
  org:
    # No explicit file list here; this stanza supplies an input-filter instead.
    input-files: null
    input-filter: "/data/notes/*.org"
    # NOTE(review): this path ends in .json.gz while the ledger and music
    # stanzas use .jsonl.gz -- confirm whether the difference is intentional.
    compressed-jsonl: "/data/generated/notes.json.gz"
    embeddings-file: "/data/generated/note_embeddings.pt"
  ledger:
    # No explicit file list here; this stanza supplies an input-filter instead.
    input-files: null
    # Quoted for consistency with the other stanzas; the values are unchanged.
    input-filter: "/data/ledger/*.beancount"
    compressed-jsonl: "/data/generated/transactions.jsonl.gz"
    embeddings-file: "/data/generated/transaction_embeddings.pt"
  image:
    # Unlike the other stanzas, images are configured by directory.
    input-directory: "/data/images/"
    embeddings-file: "/data/generated/image_embeddings.pt"
    batch-size: 50
    use-xmp-metadata: true
  music:
    # Explicit file list here; input-filter is left unset.
    input-files: ["/data/music/music.org"]
    input-filter: null
    compressed-jsonl: "/data/generated/songs.jsonl.gz"
    embeddings-file: "/data/generated/song_embeddings.pt"
search-type:
  # One stanza per search type; each names the model(s) to use and the
  # directory given as model_directory for that search type.
  # NOTE(review): model_directory is snake_case while every other key in this
  # file is kebab-case. It is left unchanged because the key name expected by
  # the consuming application is not visible here -- confirm before renaming.
  symmetric:
    encoder: "sentence-transformers/paraphrase-MiniLM-L6-v2"
    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
    model_directory: "/data/models/symmetric"
  asymmetric:
    encoder: "sentence-transformers/msmarco-MiniLM-L-6-v3"
    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
    model_directory: "/data/models/asymmetric"
  image:
    # Only an encoder is configured for images; no cross-encoder entry.
    encoder: "clip-ViT-B-32"
    model_directory: "/data/models/image_encoder"
processor:
  conversation:
    # Left null in this sample. Supply your own key locally and keep real
    # API keys out of version control.
    openai-api-key: null
    conversation-logfile: "/data/generated/conversation_logs.json"