# Per-content-type settings. Entries set to null carry no settings in this file.
content-type:
  # The /data/<folder>/ prefix on the paths below is the directory to which
  # the local files are copied in the docker-compose.
  # If you change it, change the docker-compose volumes to match.
  org:
    input-files: null
    input-filter: ["/data/org/**/*.org"]
    compressed-jsonl: "/data/embeddings/notes.jsonl.gz"
    embeddings-file: "/data/embeddings/note_embeddings.pt"
    index_heading_entries: false

  markdown:
    input-files: null
    input-filter: ["/data/markdown/**/*.markdown"]
    compressed-jsonl: "/data/embeddings/markdown.jsonl.gz"
    embeddings-file: "/data/embeddings/markdown_embeddings.pt"

  pdf:
    input-files: null
    input-filter: ["/data/pdf/**/*.pdf"]
    compressed-jsonl: "/data/embeddings/pdf.jsonl.gz"
    embeddings-file: "/data/embeddings/pdf_embeddings.pt"

  image:
    input-directories: ["/data/images/"]
    embeddings-file: "/data/embeddings/image_embeddings.pt"
    batch-size: 50
    use-xmp-metadata: false

  # NOTE(review): placement of these three keys under content-type is
  # inferred from key order -- confirm against the consumer's schema.
  notion: null
  github: null
  plugins: null

# Per-search-type model settings. model_directory values are paths under
# /data/models/; symmetric is left unset (null).
search-type:
  symmetric: null
  asymmetric:
    encoder: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
    cross-encoder: "cross-encoder/ms-marco-MiniLM-L-6-v2"
    model_directory: "/data/models/asymmetric"
  image:
    encoder: "sentence-transformers/clip-ViT-B-32"
    model_directory: "/data/models/image_encoder"

processor:
  conversation:
    conversation-logfile: "/data/embeddings/conversation_logs.json"
    enable-offline-chat: false
    # NOTE(review): nesting of openai under conversation is inferred from
    # key order -- confirm against the consumer's schema.
    openai: null

app:
  should_log_telemetry: true