File size: 754 Bytes
53c9473
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
import os
import pandas as pd
import re

# Define the folder path containing the files
caps_folder = "./CAPS"

# List all files in the CAPS folder
files = os.listdir(caps_folder)

# Define a regex pattern to extract city, state, year, and plan type
pattern = re.compile(r"^(.*?),\s([A-Z]{2})\s(.{3,}?)\s(\d{4})\.pdf$")

# Extract information from file names
data = []
for file in files:
    match = pattern.match(file)
    if match:
        city, state, plan_type, year = match.groups()
        data.append([city.strip(), state, year, plan_type.strip()])

# Convert to DataFrame
df = pd.DataFrame(data, columns=["City", "State", "Year", "Plan Type"])

# Save to CSV
df.to_csv("./caps_plans.csv", index=False)

print(f"CSV file saved to: caps_plans.csv")