-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsa_raw.py
68 lines (62 loc) · 1.77 KB
/
sa_raw.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
"""
This module demonstrates the use of SQLAlchemy for executing raw SQL queries
directly. The example provided queries an enterprise database for information
about employees and their departments, specifically focusing on those within
the Engineering department.
"""
import csv
from typing import Any
# import pandas as pd
from sqlalchemy import CursorResult, Engine, TextClause, create_engine, text
engine: Engine = create_engine(
"postgresql://user:Password123@0.0.0.0:5432/data_science_prd",
)
text_clause: TextClause = text(
"""
SELECT
employees.name,
departments.name AS department,
COUNT(projects.id) AS project_count,
AVG(salaries.amount) AS average_salary
FROM
employees
JOIN
departments ON employees.department_id = departments.id
LEFT JOIN
projects ON projects.employee_id = employees.id
JOIN
salaries ON employees.id = salaries.employee_id
WHERE
departments.name = 'Engineering'
GROUP BY
employees.name, departments.name
HAVING
COUNT(projects.id) > 5
ORDER BY
average_salary DESC;
"""
)
with engine.connect() as connection:
cursor_result: CursorResult[Any] = connection.execute(
text_clause,
)
data: list[tuple[Any, ...]] = [tuple(row) for row in cursor_result]
# [(1, "A", 54.4,), (2, "ASDA", 0.42, ), (...), (), (), (), (), (), ... ]
for record in data:
print(record)
file_header: list[str] = [
"EMPLOYEE_NAME",
"DEPARTMENT",
"PROJECT_COUNT",
"AVERAGE_SALARY",
]
filename: str = "data.csv"
with open(filename, "w") as text_io_wrapper:
writer = csv.writer(
text_io_wrapper,
)
writer.writerow(file_header)
for record in data:
writer.writerow(record)
# Another option with Pandas
# dataframe: pd.DataFrame = pd.DataFrame(data, columns=file_header,)