2021-08-22 03:47:55 +02:00
|
|
|
# Top-level section for content sources. Indentation is not visible in this
# view, so nesting is an assumption: presumably the org, markdown, ledger and
# music entries that follow are children of this key — TODO confirm.
# NOTE(review): the bare timestamp and `|` lines throughout look like
# blame-view residue rather than configuration — confirm against the original.
content-type:
|
2022-01-29 07:32:12 +01:00
|
|
|
# The /data/folder/ prefix to the folders is here because this is
|
|
|
|
# the directory to which the local files are copied in the docker-compose.
|
|
|
|
# If you change this prefix, update the docker-compose volumes to match.
|
2021-08-22 03:47:55 +02:00
|
|
|
# Org entry: an explicit file list, a glob filter, and two paths under
# /data/embeddings/.
org:
|
2022-01-29 07:32:12 +01:00
|
|
|
# No explicit file list is set (null); the glob in input-filter is the only
# input selector given for this entry.
input-files: null
|
|
|
|
# Glob for .org files directly under /data/notes/. Quoted, so it is read as a
# plain string.
input-filter: "/data/notes/*.org"
|
2022-01-29 10:13:36 +01:00
|
|
|
# Gzip-suffixed JSONL path. NOTE(review): presumably written by the consuming
# application rather than supplied by the user — confirm.
compressed-jsonl: "/data/embeddings/notes.jsonl.gz"
|
2022-01-29 09:24:02 +01:00
|
|
|
# Path with a .pt suffix; presumably a serialized embeddings tensor — confirm.
embeddings-file: "/data/embeddings/note_embeddings.pt"
|
2021-08-22 03:47:55 +02:00
|
|
|
|
2022-07-21 19:54:30 +02:00
|
|
|
# Markdown entry: same four keys as the org entry, pointing at
# /data/markdown/ for input.
markdown:
|
|
|
|
# No explicit file list is set (null); only the glob below selects input.
input-files: null
|
|
|
|
# Glob for .md files directly under /data/markdown/.
input-filter: "/data/markdown/*.md"
|
|
|
|
# Gzip-suffixed JSONL path under /data/embeddings/. NOTE(review): presumably
# an output of the consuming application — confirm.
compressed-jsonl: "/data/embeddings/markdown.jsonl.gz"
|
|
|
|
# Path with a .pt suffix; presumably a serialized embeddings tensor — confirm.
embeddings-file: "/data/embeddings/markdown_embeddings.pt"
|
|
|
|
|
2021-08-23 06:54:49 +02:00
|
|
|
# Ledger entry: same four keys as the org and markdown entries.
# NOTE(review): the three path values here are unquoted plain scalars, while
# the sibling entries quote theirs. They still parse as strings because each
# begins with `/`; a value beginning with `*` would be read as a YAML alias.
ledger:
|
2021-10-03 01:11:27 +02:00
|
|
|
# No explicit file list is set (null); only the glob below selects input.
input-files: null
|
2022-01-29 07:32:12 +01:00
|
|
|
# Glob for .beancount files directly under /data/ledger/.
input-filter: /data/ledger/*.beancount
|
2022-01-29 09:24:02 +01:00
|
|
|
# Gzip-suffixed JSONL path under /data/embeddings/. NOTE(review): presumably
# an output of the consuming application — confirm.
compressed-jsonl: /data/embeddings/transactions.jsonl.gz
|
|
|
|
# Path with a .pt suffix; presumably a serialized embeddings tensor — confirm.
embeddings-file: /data/embeddings/transaction_embeddings.pt
|
2021-08-23 06:54:49 +02:00
|
|
|
|
2022-08-04 01:20:45 +02:00
|
|
|
# image:
|
|
|
|
# input-directories: ["/data/images/"]
|
|
|
|
# embeddings-file: "/data/embeddings/image_embeddings.pt"
|
|
|
|
# batch-size: 50
|
|
|
|
# use-xmp-metadata: true
|
2021-10-03 01:11:27 +02:00
|
|
|
|
|
|
|
# Music entry: unlike the org, markdown and ledger entries, this one names
# its input explicitly and leaves the glob filter unset.
music:
|
2022-01-29 07:32:12 +01:00
|
|
|
# Flow-style list holding a single path to an .org file.
input-files: ["/data/music/music.org"]
|
2021-10-03 01:11:27 +02:00
|
|
|
# No glob is set (null); the explicit list above is the only input selector.
input-filter: null
|
2022-01-29 09:24:02 +01:00
|
|
|
# Gzip-suffixed JSONL path under /data/embeddings/. NOTE(review): presumably
# an output of the consuming application — confirm.
compressed-jsonl: "/data/embeddings/songs.jsonl.gz"
|
|
|
|
# Path with a .pt suffix; presumably a serialized embeddings tensor — confirm.
embeddings-file: "/data/embeddings/song_embeddings.pt"
|
2021-08-23 06:54:49 +02:00
|
|
|
|
2021-08-22 03:47:55 +02:00
|
|
|
# Top-level section for search models. Presumably the symmetric, asymmetric
# and image entries that follow are its children (indentation is not visible
# in this view) — TODO confirm.
search-type:
|
2022-01-14 22:46:56 +01:00
|
|
|
# Symmetric search entry: two model identifiers plus a directory path.
symmetric:
|
2022-07-18 18:16:40 +02:00
|
|
|
# Model identifier in "namespace/name" form; presumably resolved by the
# sentence-transformers library — confirm.
encoder: "sentence-transformers/all-MiniLM-L6-v2"
|
2022-01-14 22:46:56 +01:00
|
|
|
# Second model identifier; the same value is used by the asymmetric entry.
cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
|
2022-01-29 07:32:12 +01:00
|
|
|
# NOTE(review): this key uses an underscore while sibling keys are
# kebab-case. Left unchanged because the consumer's schema is not visible.
model_directory: "/data/models/symmetric"
|
2022-01-14 22:46:56 +01:00
|
|
|
|
2021-08-22 03:47:55 +02:00
|
|
|
# Asymmetric search entry: same three keys as the symmetric entry, with a
# different encoder and model directory.
asymmetric:
|
2022-07-18 18:00:19 +02:00
|
|
|
# Model identifier in "namespace/name" form; presumably resolved by the
# sentence-transformers library — confirm.
encoder: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
|
2021-08-22 03:47:55 +02:00
|
|
|
# Identical to the cross-encoder value in the symmetric entry.
cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
|
2022-01-29 07:32:12 +01:00
|
|
|
# NOTE(review): this key uses an underscore while sibling keys are
# kebab-case. Left unchanged because the consumer's schema is not visible.
model_directory: "/data/models/asymmetric"
|
2021-08-23 06:54:49 +02:00
|
|
|
|
|
|
|
# Image search entry: an encoder name and a model directory; no cross-encoder
# key is given here.
# NOTE(review): the content-type `image` entry earlier in the file is
# commented out while this entry is active — confirm that is intended.
image:
|
|
|
|
# Bare model name with no namespace prefix, unlike the other encoder values.
encoder: "clip-ViT-B-32"
|
2022-01-29 07:32:12 +01:00
|
|
|
# NOTE(review): this key uses an underscore while most keys in the file are
# kebab-case. Left unchanged because the consumer's schema is not visible.
model_directory: "/data/models/image_encoder"
|
2021-11-26 20:56:26 +01:00
|
|
|
|
|
|
|
# Processor section with a single conversation entry. Presumably
# `conversation` is nested under `processor` (indentation is not visible in
# this view) — TODO confirm.
processor:
|
|
|
|
conversation:
|
|
|
|
# No API key is set (null).
# NOTE(review): if a real key is ever placed here, keep the file out of
# version control or load the key from the environment instead.
openai-api-key: null
|
2022-01-29 09:24:02 +01:00
|
|
|
# JSON file path under /data/embeddings/, the same directory used for the
# embeddings artifacts above.
conversation-logfile: "/data/embeddings/conversation_logs.json"
|