about summary refs log tree commit diff
path: root/scrape_ecourtindia_v6/create_named_pdfs.py
blob: c47c66efd505ff4708ac5624c99080a63e19e27b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
import os
import re
import shutil

from tinydb import TinyDB

def sanitize_filename(filename):
    """Return *filename* made safe for use as a single file-name component.

    The characters ``< > : " / | ? * ( )`` and the backslash are each
    replaced with an underscore, consecutive underscores are then squeezed
    into one, and finally any leading or trailing underscores and spaces
    are removed.
    """
    # Pass 1 swaps every reserved character for '_'; pass 2 collapses the
    # resulting (or pre-existing) runs of underscores into a single one.
    for pattern in (r'[<>:"/\\|?*()]', r'_+'):
        filename = re.sub(pattern, '_', filename)

    return filename.strip('_ ')

# Directory that receives the descriptively named copies of each PDF.
output_dir = 'named_pdf'

# Read every stored record, then release the database file straight away:
# nothing below writes back to it, so there is no reason to keep it open.
with TinyDB('orders.json') as db:
    entries = db.all()

# shutil.copyfile() does not create missing parent directories; without this
# every single copy fails when the output directory does not exist yet.
os.makedirs(output_dir, exist_ok=True)

for entry in entries:
    # Each record supplies the three name components plus the path of the
    # already-downloaded file under 'filename'.
    date = sanitize_filename(entry['date'])
    case_info = sanitize_filename(entry['case_info'])
    court_name = sanitize_filename(entry['court_name'])
    source = entry['filename']

    newname = f"{output_dir}/{date}---{case_info}---{court_name}.pdf"

    # NOTE(review): records that produce the same target name overwrite one
    # another, because copyfile() replaces an existing destination.
    try:
        shutil.copyfile(source, newname)
    except Exception as e:
        # Best-effort batch: report the failing file and keep going so one
        # bad record does not abort the remaining copies.
        print(f"Error copying {source}: {e}")