# Provenance: reconstructed from patch
#   commit  97d1df0cd10f9f4adc1991cc8067cc8f1d3978cf
#   author  Raghuram Subramani <raghus2247@gmail.com>
#   date    Thu, 27 Mar 2025 23:50:36 +0530
#   subject add create named pdfs
#   file    scrape_ecourtindia_v6/create_named_pdfs.py (new file)
"""Copy order PDFs listed in ``orders.json`` to descriptive file names.

Every record in the TinyDB database ``orders.json`` is expected to carry the
keys ``date``, ``case_info``, ``court_name`` and ``filename``. The file at
``filename`` is copied to
``named_pdf/<date>---<case_info>---<court_name>.pdf`` after each name
component has been passed through :func:`sanitize_filename`.
"""

import re
import shutil
from pathlib import Path

# Directory (relative to the working directory) that receives the copies.
OUTPUT_DIR = 'named_pdf'

# Characters replaced by '_' in a file name component.
_UNSAFE_CHARS = re.compile(r'[<>:"/\\|?*()]')
# Runs of underscores, collapsed to a single '_'.
_UNDERSCORE_RUN = re.compile(r'_+')


def sanitize_filename(filename):
    """Return *filename* with unsafe characters replaced by underscores.

    Each of ``< > : " / \\ | ? * ( )`` becomes ``_``, consecutive underscores
    are collapsed into one, and leading/trailing underscores and spaces are
    stripped.

    Args:
        filename: The raw text to turn into a file name component.

    Returns:
        The sanitized string (possibly empty).
    """
    filename = _UNSAFE_CHARS.sub('_', filename)
    filename = _UNDERSCORE_RUN.sub('_', filename)
    return filename.strip('_ ')


def copy_named_pdfs(entries, output_dir=OUTPUT_DIR):
    """Copy each entry's PDF into *output_dir* under a descriptive name.

    Args:
        entries: Iterable of mappings with the keys ``date``, ``case_info``,
            ``court_name`` and ``filename``.
        output_dir: Destination directory; created if it does not exist.

    Returns:
        The number of files copied successfully.

    Raises:
        KeyError: If an entry lacks one of the required keys.
    """
    target_dir = Path(output_dir)
    # copyfile does not create missing parent directories; without this every
    # copy fails with FileNotFoundError on a fresh checkout.
    target_dir.mkdir(parents=True, exist_ok=True)

    copied = 0
    for entry in entries:
        date = sanitize_filename(entry['date'])
        case_info = sanitize_filename(entry['case_info'])
        court_name = sanitize_filename(entry['court_name'])

        newname = target_dir / f"{date}---{case_info}---{court_name}.pdf"

        try:
            shutil.copyfile(entry['filename'], newname)
        except OSError as e:
            # Best effort: report the failed copy and carry on with the rest.
            print(f"Error copying {entry['filename']}: {e}")
        else:
            copied += 1

    return copied


def main():
    """Read every record from ``orders.json`` and copy its PDF."""
    # Imported here so the helpers above stay importable without tinydb.
    from tinydb import TinyDB

    # The context manager closes the database file once the records are read.
    with TinyDB('orders.json') as db:
        entries = db.all()

    copy_named_pdfs(entries)


if __name__ == '__main__':
    main()