Update khoj docker config to index subdirectories for text content

- Khoj supports indexing subdirectories, but the khoj docker config
  wasn't updated to do the same
- This should also allow khoj docker users to index multiple separate
  directory trees by mounting them into separate subfolders within
  /data/<content-type>/.
  E.g. /data/org/dir1, /data/org/dir2, etc. in khoj_docker.yml
This commit is contained in:
Debanjum Singh Solanky 2023-02-06 20:57:06 -03:00
parent 66dca6cf33
commit 11a18cc452

View file

@@ -4,20 +4,20 @@ content-type:
# If changing, the docker-compose volumes should also be changed to match. # If changing, the docker-compose volumes should also be changed to match.
org: org:
input-files: null input-files: null
input-filter: ["/data/org/*.org"] input-filter: ["/data/org/**/*.org"]
compressed-jsonl: "/data/embeddings/notes.jsonl.gz" compressed-jsonl: "/data/embeddings/notes.jsonl.gz"
embeddings-file: "/data/embeddings/note_embeddings.pt" embeddings-file: "/data/embeddings/note_embeddings.pt"
index_heading_entries: false index_heading_entries: false
markdown: markdown:
input-files: null input-files: null
input-filter: ["/data/markdown/*.md"] input-filter: ["/data/markdown/**/*.md"]
compressed-jsonl: "/data/embeddings/markdown.jsonl.gz" compressed-jsonl: "/data/embeddings/markdown.jsonl.gz"
embeddings-file: "/data/embeddings/markdown_embeddings.pt" embeddings-file: "/data/embeddings/markdown_embeddings.pt"
ledger: ledger:
input-files: null input-files: null
input-filter: ["/data/ledger/*.beancount"] input-filter: ["/data/ledger/**/*.beancount"]
compressed-jsonl: /data/embeddings/transactions.jsonl.gz compressed-jsonl: /data/embeddings/transactions.jsonl.gz
embeddings-file: /data/embeddings/transaction_embeddings.pt embeddings-file: /data/embeddings/transaction_embeddings.pt