mirror of
https://github.com/khoj-ai/khoj.git
synced 2024-11-27 17:35:07 +01:00
Encode jsonl data as UTF-8 when writing the gzip file, so reads and writes use a consistent encoding
Should help with issue #89
This commit is contained in:
parent
c156b3e087
commit
11517ba8eb
1 changed file with 1 addition and 1 deletion
|
@@ -51,7 +51,7 @@ def compress_jsonl_data(jsonl_data, output_path):
|
||||||
# Create output directory, if it doesn't exist
|
# Create output directory, if it doesn't exist
|
||||||
output_path.parent.mkdir(parents=True, exist_ok=True)
|
output_path.parent.mkdir(parents=True, exist_ok=True)
|
||||||
|
|
||||||
with gzip.open(output_path, 'wt') as gzip_file:
|
with gzip.open(output_path, 'wt', encoding='utf-8') as gzip_file:
|
||||||
gzip_file.write(jsonl_data)
|
gzip_file.write(jsonl_data)
|
||||||
|
|
||||||
logger.info(f'Wrote jsonl data to gzip compressed jsonl at {output_path}')
|
logger.info(f'Wrote jsonl data to gzip compressed jsonl at {output_path}')
|
Loading…
Reference in a new issue