diff --git a/scripts/nsa/save_pages_from_db_to_file.py b/scripts/nsa/save_pages_from_db_to_file.py index 1c5de09..38c2965 100644 --- a/scripts/nsa/save_pages_from_db_to_file.py +++ b/scripts/nsa/save_pages_from_db_to_file.py @@ -19,7 +19,7 @@ def fetch_documents(collection, batch_size=5000): def write_to_parquet_in_chunks(file_path, collection, batch_size=5000, chunk_size=50000): - file_path.mkdir(parents=True, exist_ok=True) + file_path.parent.mkdir(parents=True, exist_ok=True) buffer = [] chunk_index = 0