-
Notifications
You must be signed in to change notification settings - Fork 0
/
csv-pdf.py
67 lines (58 loc) · 2.24 KB
/
csv-pdf.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
import os
import pandas as pd
from reportlab.lib import colors
from reportlab.lib.pagesizes import letter
from reportlab.platypus import SimpleDocTemplate, Table, TableStyle
def create_table(data):
data_list = [data.columns.tolist()] + data.values.tolist()
table = Table(data_list)
table.setStyle(TableStyle([
('BACKGROUND', (0, 0), (-1, 0), colors.gray),
('TEXTCOLOR', (0, 0), (-1, 0), colors.whitesmoke),
('ALIGN', (0, 0), (-1, -1), 'CENTER'),
('FONTNAME', (0, 0), (-1, 0), 'Helvetica-Bold'),
('BOTTOMPADDING', (0, 0), (-1, 0), 12),
('BACKGROUND', (0, 1), (-1, -1), colors.beige),
('GRID', (0, 0), (-1, -1), 1, colors.black),
('VALIGN', (0, 0), (-1, -1), 'MIDDLE')
]))
return table
def parse_csv_sections(file_path):
# Open and read the file line by line
with open(file_path, 'r') as file:
lines = file.readlines()
# Find the dividing line based on empty line or format change
sections = []
current_section = []
for line in lines:
if line.strip() == "":
if current_section:
sections.append(current_section)
current_section = []
else:
current_section.append(line)
if current_section:
sections.append(current_section)
return sections
def csv_to_pdf(csv_file_path, pdf_file_path):
sections = parse_csv_sections(csv_file_path)
pdf = SimpleDocTemplate(pdf_file_path, pagesize=letter)
elements = []
for section in sections:
# Convert section list back to a CSV string
section_csv = ''.join(section)
from io import StringIO
data = pd.read_csv(StringIO(section_csv))
table = create_table(data)
elements.append(table)
pdf.build(elements)
def process_all_csvs(directory):
for filename in os.listdir(directory):
if filename.endswith('.csv'):
csv_file_path = os.path.join(directory, filename)
pdf_file_path = os.path.join(directory, filename.replace('.csv', '.pdf'))
csv_to_pdf(csv_file_path, pdf_file_path)
print(f'Converted {filename} to PDF.')
# Example usage
source_folder = '/Users/agi/Dropbox/Taxes_2023/BOA'
process_all_csvs(source_folder)