In [1]:
import ReportTimerange as rtr
import ReportMailer as rm
import GuestbookDbConnect as gdb

In [2]:
# Install a conda package in the current Jupyter kernel
import sys
!{sys.executable} -m pip install xlsxwriter



# Reporting Period #
* PD - yesterday
* PW - previous week
* PM - previous month
* PQ - previous quarter
* PY - previous calendar year
* YTD year to date
* WTD current week to date
* TODAY today
* P90 - previous 90days

In [3]:
acronyms = [ "PD", "PW", "PM", "PQ", "PY", "YTD", "WTD", "TODAY", "P90"]
friendly = [ "Prior Day", "Prior Week", "Prior Month", "Prior Quarter", "Prior Year", "Year to Date", "Week to Date", "Today", "Previous 90 days"]

def toPeriodFriendly(INTERVAL):
    for n in range(0, len(acronyms)):
      if INTERVAL==acronyms[n]:
         return friendly[n]
    return "Unknown Period"

In [4]:
_INTERVAL = "PQ"

In [5]:
from pandas import ExcelWriter
from pandas import ExcelFile
import xlsxwriter
import datetime

def createSpreadsheetAndMailIt(collections, reportname, recipients, subject, body):
  now = datetime.datetime.now().strftime('%Y-%m-%d_%H%M%S')
  filename = reportname + "-" + now + ".xlsx"
  #writer = ExcelWriter(filename)
  writer = ExcelWriter(filename, engine='xlsxwriter')
  workbook = writer.book  
  print("Writing dataframe to Excel file {0}".format(filename))
  for collection in collections:
    print("Writing {} to spreadsheet".format(collection["name"]))
    collection["dataframe"].to_excel(writer, sheet_name=collection["name"], index=False)
    worksheet = writer.sheets[collection["name"]]
    if 'colwidths' in collection:
      colwidths = collection['colwidths']
      print("colwidths={}".format(colwidths))
      for n in range(0, len(colwidths)):
        col = str(chr(65 + n))
        worksheet.set_column('{}:{}'.format(col,col), colwidths[n])
    else:
      worksheet.set_column('A:A', 30)
  writer.save()
  for recipient in recipients: 
    rm.mailer(recipient, subject, body, filename)
  print("Excel/Email Done!")

In [6]:
import psycopg2 as pg
import pandas.io.sql as psql
import pandas as pd

conn = gdb.guestbookDbConnect()

Welcome to Jupyter Notebook.  You are connected to the Opportunity House guestbook database!


In [7]:
trange = rtr.timerange(_INTERVAL)
print(trange)

collections = []
summaries = []

collection = {}
collection["name"] = "Outline"

df = pd.DataFrame({"Report Tab":[ \
              "Summary", \
              "Distinct Clients", \
              "Services", \
              "Housing", \
              "Gender", \
              "Ethnicity", \
              "Veterans", \
              "New Clients"
                                 ], \
                   "Description":[ \
              "summary totals for the report period", \
              "a count of individuals served by sub-period within the period.", \
              "breakdown by service type and sub-period within the period.", \
              "breakdown by housing conditions and sub-period within the period.", \
              "breakdown by gender and sub-period within the period.", \
              "breakdown by ethnicity and sub-period within the period.", \
              "breakdown by veteran status and sub-period within the period.", \
              "a list of clients with first visit occurring in the report period."
                                 ]})

collection["dataframe"] = df 
collection["colwidths"] = [30, 100]
collections.append(collection)



df.head(1000)

[datetime.datetime(2020, 1, 1, 0, 0), datetime.datetime(2020, 3, 31, 23, 59, 59, 999999), 'YYYY-MM/DD WW']


Unnamed: 0,Report Tab,Description
0,Summary,summary totals for the report period
1,Distinct Clients,a count of individuals served by sub-period wi...
2,Services,breakdown by service type and sub-period withi...
3,Housing,breakdown by housing conditions and sub-period...
4,Gender,breakdown by gender and sub-period within the ...
5,Ethnicity,breakdown by ethnicity and sub-period within t...
6,Veterans,breakdown by veteran status and sub-period wit...
7,New Clients,a list of clients with first visit occurring i...


## Total distinct clients in report period ##

In [8]:
summary = {}
summary["name"] = "Total distinct clients in report period"

query = "SELECT min(timestamp)AS start, max(timestamp) AS end, \
         COUNT(DISTINCT person_id) AS clients FROM guestbook_personsnapshot \
         WHERE timestamp BETWEEN '{}' AND '{}'".format(trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)

summary["count"] = data.iloc[0,2]
summaries.append(summary)
print(summaries)

data.head(100)

SELECT min(timestamp)AS start, max(timestamp) AS end,          COUNT(DISTINCT person_id) AS clients FROM guestbook_personsnapshot          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'
[{'name': 'Total distinct clients in report period', 'count': 256}]


Unnamed: 0,start,end,clients
0,2020-01-02 13:28:00.745733+00:00,2020-03-19 12:33:20.456309+00:00,256


# Distinct clients by sub-interval within the report period #
* Statistics focused on the breadth of individuals that are served during the time period.

In [9]:
collection = {}
collection["name"] = "Distinct Clients"

query = "SELECT to_char(timestamp,'{}') AS period,  \
         COUNT(DISTINCT person.idperson) AS clients \
         FROM guestbook_personsnapshot snapshot \
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY period".format(trange[2], trange[0], trange[1])
print(query)

data = pd.read_sql(query, conn)
#data.head(1000)

persons = data.pivot_table('clients', index=['period']).fillna(0).astype(int).reset_index('period')

collection["dataframe"] = persons 
collection["colwidths"] = [30, 20]
collections.append(collection)
persons.head(1000)

SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,           COUNT(DISTINCT person.idperson) AS clients          FROM guestbook_personsnapshot snapshot          JOIN guestbook_person person ON person.idperson=snapshot.person_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY period


Unnamed: 0,period,clients
0,2020-01/02 01,27
1,2020-01/03 01,25
2,2020-01/06 01,33
3,2020-01/07 01,31
4,2020-01/09 02,35
5,2020-01/10 02,37
6,2020-01/13 02,28
7,2020-01/14 02,31
8,2020-01/15 03,38
9,2020-01/16 03,34


## Total Services delivered in report period ##

In [10]:
query = "SELECT \
         left(service.name, strpos(service.name, '/') - 1) AS servicename, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_personservicerequest servicerequest ON servicerequest.connection_id=snapshot.idsnapshot \
         JOIN guestbook_service service ON service.idservice=servicerequest.service_id \
         WHERE timestamp BETWEEN '{}' AND '{}'  AND service.points<=0 \
         GROUP BY servicename \
         ORDER BY total desc".format(trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)


for n in range(0, data.shape[0]):  
  summary = {}
  summary["name"]  = data.iloc[n,0] + " services delivered."
  summary["count"] = data.iloc[n,1]
  summaries.append(summary)
print(summaries)
data.head(1000)

SELECT          left(service.name, strpos(service.name, '/') - 1) AS servicename, COUNT(*) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_personservicerequest servicerequest ON servicerequest.connection_id=snapshot.idsnapshot          JOIN guestbook_service service ON service.idservice=servicerequest.service_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'  AND service.points<=0          GROUP BY servicename          ORDER BY total desc
[{'name': 'Total distinct clients in report period', 'count': 256}, {'name': 'Meals services delivered.', 'count': 1275}, {'name': 'Shower services delivered.', 'count': 322}, {'name': 'Clothing services delivered.', 'count': 245}, {'name': 'Computer services delivered.', 'count': 197}, {'name': 'Laundry services delivered.', 'count': 136}, {'name': 'Nurse services delivered.', 'count': 106}, {'name': 'Pastor Consultation services delivered.', 'count': 100}]


Unnamed: 0,servicename,total
0,Meals,1275
1,Shower,322
2,Clothing,245
3,Computer,197
4,Laundry,136
5,Nurse,106
6,Pastor Consultation,100


# Services delivered by sub-interval within the report period #

In [11]:
collection = {}
collection["name"] = "Services"

#query = "SELECT to_char(timestamp,'{}') AS period, \
#         service.name AS servicename, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
#         JOIN guestbook_personservicerequest servicerequest ON servicerequest.connection_id=snapshot.idsnapshot \
#         JOIN guestbook_service service ON service.idservice=servicerequest.service_id \
#         WHERE timestamp BETWEEN '{}' AND '{}' \
#         GROUP BY period, servicename".format(trange[2], trange[0], trange[1])

query = "SELECT to_char(timestamp,'{}') AS period, \
         left(service.name, strpos(service.name, '/') - 1) AS servicename, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_personservicerequest servicerequest ON servicerequest.connection_id=snapshot.idsnapshot \
         JOIN guestbook_service service ON service.idservice=servicerequest.service_id \
         WHERE timestamp BETWEEN '{}' AND '{}' AND service.points<=0 \
         GROUP BY period, servicename".format(trange[2], trange[0], trange[1])



print(query)

data = pd.read_sql(query, conn)

services = data.pivot_table('total', index=['period'], columns='servicename').fillna(0).astype(int).reset_index('period')
collection["dataframe"] = services 
collection["colwidths"] = [30, 20, 20, 20, 20, 20, 20, 20]
collections.append(collection)

services.head(1000)

SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,          left(service.name, strpos(service.name, '/') - 1) AS servicename, COUNT(*) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_personservicerequest servicerequest ON servicerequest.connection_id=snapshot.idsnapshot          JOIN guestbook_service service ON service.idservice=servicerequest.service_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999' AND service.points<=0          GROUP BY period, servicename


servicename,period,Clothing,Computer,Laundry,Meals,Nurse,Pastor Consultation,Shower
0,2020-01/02 01,0,3,3,22,0,1,7
1,2020-01/03 01,9,4,1,22,3,0,4
2,2020-01/06 01,13,3,3,32,0,2,10
3,2020-01/07 01,0,9,5,30,8,2,6
4,2020-01/09 02,0,10,5,35,7,5,8
5,2020-01/10 02,15,8,2,31,5,5,4
6,2020-01/13 02,11,5,3,23,0,3,10
7,2020-01/14 02,0,6,6,31,4,4,10
8,2020-01/15 03,12,6,2,34,0,6,4
9,2020-01/16 03,0,4,4,29,6,3,9


# Housing totals within the report period#

In [12]:
query = "SELECT  \
         left(housing.name, strpos(housing.name, '(') - 1)  AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot \
         JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id \
         WHERE timestamp BETWEEN '{}' AND '{}' AND prompt_id=8 \
         GROUP BY hresponse".format(trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)

for n in range(0, data.shape[0]):  
  summary = {}
  summary["name"]  = " Days spent in " + data.iloc[n,0] 
  summary["count"] = data.iloc[n,1]
  summaries.append(summary)
print(summaries)

data.head(1000)

SELECT           left(housing.name, strpos(housing.name, '(') - 1)  AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot          JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999' AND prompt_id=8          GROUP BY hresponse
[{'name': 'Total distinct clients in report period', 'count': 256}, {'name': 'Meals services delivered.', 'count': 1275}, {'name': 'Shower services delivered.', 'count': 322}, {'name': 'Clothing services delivered.', 'count': 245}, {'name': 'Computer services delivered.', 'count': 197}, {'name': 'Laundry services delivered.', 'count': 136}, {'name': 'Nurse services delivered.', 'count': 106}, {'name': 'Pastor Consultation services delivered.', 'count': 100}, {'name': ' Days spent in Unstable housing ', 'count': 259}, {'name': ' Days spent in Jail or 

Unnamed: 0,hresponse,total
0,Unstable housing,259
1,Jail or priso,5
2,Sheltered,230
3,Stable housing,235
4,Unsheltered,577


# Housing by sub-interval within the report period#
* Answers to the prompt 'Where did you spend last night?'

In [13]:
collection = {}
collection["name"] = "Housing"

#query = "SELECT to_char(timestamp,'{}') AS period, \
#         housing.name AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
#         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot \
#         JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id \
#         WHERE timestamp BETWEEN '{}' AND '{}' AND prompt_id=8 \
#         GROUP BY period, hresponse".format(trange[2], trange[0], trange[1])

query = "SELECT to_char(timestamp,'{}') AS period, \
         left(housing.name, strpos(housing.name, '(') - 1) AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot \
         JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id \
         WHERE timestamp BETWEEN '{}' AND '{}' AND prompt_id=8 \
         GROUP BY period, hresponse".format(trange[2], trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)

housing = data.pivot_table('total', index=['period'], columns='hresponse').fillna(0).astype(int).reset_index('period')
#housing = housing.fillna(0)
collection["dataframe"] = housing  
collection["colwidths"] = [30, 30, 30, 30, 30, 30]
collections.append(collection)
housing.head(1000)

SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,          left(housing.name, strpos(housing.name, '(') - 1) AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot          JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999' AND prompt_id=8          GROUP BY period, hresponse


hresponse,period,Jail or priso,Sheltered,Stable housing,Unsheltered,Unstable housing
0,2020-01/02 01,0,4,2,14,3
1,2020-01/03 01,0,6,4,9,3
2,2020-01/06 01,0,5,9,12,5
3,2020-01/07 01,0,7,6,11,5
4,2020-01/09 02,0,5,4,16,6
5,2020-01/10 02,0,8,7,10,5
6,2020-01/13 02,0,7,3,11,4
7,2020-01/14 02,0,5,4,13,6
8,2020-01/15 03,1,7,4,19,5
9,2020-01/16 03,0,8,5,12,7


# Clients (by name) Reporting Unsheltered Housing #
* more than once in the report period

In [14]:
collection = {}
collection["name"] = "Unsheltered_by_Name"

unsheltered = 5
threshold = 1

#query = "SELECT to_char(timestamp,'{}') AS period, \
#         housing.name AS hresponse, COUNT(*) AS total FROM guestbook_personsnapshot snapshot\
#         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot \
#         JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id \
#         WHERE timestamp BETWEEN '{}' AND '{}' AND prompt_id=8 \
#         GROUP BY period, hresponse".format(trange[2], trange[0], trange[1])

query = "SELECT person.firstname, person.lastname, person.aliasname, \
         COUNT(*) AS unsheltered_nights FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot \
         JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id \
         WHERE timestamp BETWEEN '{}' AND '{}' AND prompt_id=8 AND object_id={} \
         GROUP BY person.idperson ORDER BY COUNT(*) desc".format(trange[0], trange[1], unsheltered)

print(query)

data = pd.read_sql(query, conn)
data.head(100)

#housing = data.pivot_table('total', index=['period'], columns='hresponse').fillna(0).astype(int).reset_index('period')
collection["dataframe"] = data 
collection["colwidths"] = [30, 30, 30, 30, 30, 30]
collections.append(collection)
data.head(1000)

SELECT person.firstname, person.lastname, person.aliasname,          COUNT(*) AS unsheltered_nights FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_personsurvey survey ON survey.connection_id=snapshot.idsnapshot          JOIN guestbook_housingresponse housing ON housing.idhousing=survey.object_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999' AND prompt_id=8 AND object_id=5          GROUP BY person.idperson ORDER BY COUNT(*) desc


Unnamed: 0,firstname,lastname,aliasname,unsheltered_nights
0,AARON,SPIVEY,AS9512,45
1,JAMES,HUCKABY,JAMESH,42
2,RONNIE,STANCIL,RON,40
3,ANTONIO,MORRIS,TONIO,39
4,SHERYL,SHOULDERS,SHERYL,36
5,AARON,AYERS,AARONA,34
6,PAT,GILMORE,PATG,32
7,STEVE,SLOAN,STEVE,32
8,DAVID,STIREWALT,HAWK,25
9,RAVON,CRUSE,RAVON,19


# Gender totals in the report period #

In [15]:
query = "SELECT  \
         gender.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_genderresponse gender ON gender.idgender=person.gender_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY response".format(trange[0], trange[1])

print(query)
#summaries = []

data = pd.read_sql(query, conn)

for n in range(0, data.shape[0]):  
  summary = {}
  summary["name"]  = "Gender -" + data.iloc[n,0] 
  summary["count"] = data.iloc[n,1]
  summaries.append(summary)
print(summaries)

data.head(100)

SELECT           gender.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_genderresponse gender ON gender.idgender=person.gender_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY response
[{'name': 'Total distinct clients in report period', 'count': 256}, {'name': 'Meals services delivered.', 'count': 1275}, {'name': 'Shower services delivered.', 'count': 322}, {'name': 'Clothing services delivered.', 'count': 245}, {'name': 'Computer services delivered.', 'count': 197}, {'name': 'Laundry services delivered.', 'count': 136}, {'name': 'Nurse services delivered.', 'count': 106}, {'name': 'Pastor Consultation services delivered.', 'count': 100}, {'name': ' Days spent in Unstable housing ', 'count': 259}, {'name': ' Days spent in Jail or priso', 'count': 5}, {'name': ' Days spent in Shel

Unnamed: 0,response,total
0,Female,42
1,Male,99
2,Unknown,115


# Gender by sub-interval within the report period #

In [16]:
collection = {}
collection["name"] = "Gender"

query = "SELECT to_char(timestamp,'{}') AS period, \
         gender.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_genderresponse gender ON gender.idgender=person.gender_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY period, response".format(trange[2], trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)

gender = data.pivot_table('total', index=['period'], columns='response').fillna(0).astype(int).reset_index('period')
collection["dataframe"] = gender
collection["colwidths"] = [30, 20, 20, 20]
#collection["colwidths"] = []
collections.append(collection)
gender.head(1000)

SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,          gender.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_genderresponse gender ON gender.idgender=person.gender_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY period, response


response,period,Female,Male,Unknown
0,2020-01/02 01,4,18,5
1,2020-01/03 01,6,18,1
2,2020-01/06 01,5,23,5
3,2020-01/07 01,6,21,4
4,2020-01/09 02,5,25,5
5,2020-01/10 02,9,21,7
6,2020-01/13 02,6,18,4
7,2020-01/14 02,9,19,3
8,2020-01/15 03,7,26,5
9,2020-01/16 03,8,25,1


# Ethnicity totals within the report period #

In [17]:
query = "SELECT  \
         ethnicity.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_ethnicityresponse ethnicity ON ethnicity.idethnicity=person.ethnicity_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY response".format(trange[0], trange[1])

print(query)
#summaries = []

data = pd.read_sql(query, conn)
for n in range(0, data.shape[0]):  
  summary = {}
  summary["name"]  = "Ethnicity -" + data.iloc[n,0] 
  summary["count"] = data.iloc[n,1]
  summaries.append(summary)
print(summaries)
data.head(1000)

SELECT           ethnicity.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_ethnicityresponse ethnicity ON ethnicity.idethnicity=person.ethnicity_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY response
[{'name': 'Total distinct clients in report period', 'count': 256}, {'name': 'Meals services delivered.', 'count': 1275}, {'name': 'Shower services delivered.', 'count': 322}, {'name': 'Clothing services delivered.', 'count': 245}, {'name': 'Computer services delivered.', 'count': 197}, {'name': 'Laundry services delivered.', 'count': 136}, {'name': 'Nurse services delivered.', 'count': 106}, {'name': 'Pastor Consultation services delivered.', 'count': 100}, {'name': ' Days spent in Unstable housing ', 'count': 259}, {'name': ' Days spent in Jail or priso', 'count': 5}, {'name': ' 

Unnamed: 0,response,total
0,Black,89
1,Hispanic,1
2,Native American,6
3,Other,10
4,Unknown,84
5,White,66


# Ethnicity by sub-interval within the report period #

In [18]:
collection = {}
collection["name"] = "Ethnicity"

query = "SELECT to_char(timestamp,'{}') AS period, \
         ethnicity.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_ethnicityresponse ethnicity ON ethnicity.idethnicity=person.ethnicity_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY period, response".format(trange[2], trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)

ethnicity = data.pivot_table('total', index=['period'], columns='response').fillna(0).astype(int).reset_index('period')
collection["dataframe"] = ethnicity 
collection["colwidths"] = [30, 20, 20, 20, 20, 20, 20, 20]
collections.append(collection)
ethnicity.head(1000)

SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,          ethnicity.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_ethnicityresponse ethnicity ON ethnicity.idethnicity=person.ethnicity_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY period, response


response,period,Black,Hispanic,Native American,Other,Unknown,White
0,2020-01/02 01,10,1,2,1,3,10
1,2020-01/03 01,10,1,2,2,1,9
2,2020-01/06 01,11,1,4,3,4,10
3,2020-01/07 01,12,1,3,2,2,11
4,2020-01/09 02,16,1,2,2,5,9
5,2020-01/10 02,15,1,2,3,5,11
6,2020-01/13 02,18,0,3,1,1,5
7,2020-01/14 02,18,1,2,1,2,7
8,2020-01/15 03,22,1,2,2,4,7
9,2020-01/16 03,21,1,1,3,0,8


# Veteran status totals within the report period#

In [19]:
query = "SELECT  \
         yesno.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_yesnoresponse yesno ON yesno.idyesno=person.veteran_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY response \
         ORDER BY response desc".format(trange[0], trange[1])

print(query)
#summaries = []

data = pd.read_sql(query, conn)

for n in range(0, data.shape[0]):  
  summary = {}
  if data.iloc[n,0]=="Yes":
    summary["name"] = "Veterans"
  elif data.iloc[n,0]=="No":
    summary["name"] = "Non-veterans"
  else:
    summary["name"] = "Veteran status Unknown"
  summary["count"] = data.iloc[n,1]
  summaries.append(summary)
print(summaries)

data.head(1000)

SELECT           yesno.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_yesnoresponse yesno ON yesno.idyesno=person.veteran_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY response          ORDER BY response desc
[{'name': 'Total distinct clients in report period', 'count': 256}, {'name': 'Meals services delivered.', 'count': 1275}, {'name': 'Shower services delivered.', 'count': 322}, {'name': 'Clothing services delivered.', 'count': 245}, {'name': 'Computer services delivered.', 'count': 197}, {'name': 'Laundry services delivered.', 'count': 136}, {'name': 'Nurse services delivered.', 'count': 106}, {'name': 'Pastor Consultation services delivered.', 'count': 100}, {'name': ' Days spent in Unstable housing ', 'count': 259}, {'name': ' Days spent in Jail or priso', 'count': 5}, {

Unnamed: 0,response,total
0,Yes,16
1,Unknown,133
2,No,107


# Veteran Status by sub-interval within the report period#

In [20]:
collection = {}
collection["name"] = "Veterans"

query = "SELECT to_char(timestamp,'{}') AS period, \
         yesno.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot\
         JOIN guestbook_person person ON person.idperson=snapshot.person_id \
         JOIN guestbook_yesnoresponse yesno ON yesno.idyesno=person.veteran_id \
         WHERE timestamp BETWEEN '{}' AND '{}' \
         GROUP BY period, response".format(trange[2], trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)
#data.head(1000)



veterans  = data.pivot_table('total', index=['period'], columns='response').fillna(0).astype(int).reset_index('period')
veterans.columns = ['period', 'non-veteran', 'unknown','veteran']
collection["dataframe"] = veterans 
collection["colwidths"] = [30, 30, 30, 30]
collections.append(collection)
veterans.head(1000)


SELECT to_char(timestamp,'YYYY-MM/DD WW') AS period,          yesno.name AS response, COUNT(DISTINCT person.idperson) AS total FROM guestbook_personsnapshot snapshot         JOIN guestbook_person person ON person.idperson=snapshot.person_id          JOIN guestbook_yesnoresponse yesno ON yesno.idyesno=person.veteran_id          WHERE timestamp BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          GROUP BY period, response


Unnamed: 0,period,non-veteran,unknown,veteran
0,2020-01/02 01,19,6,2
1,2020-01/03 01,20,3,2
2,2020-01/06 01,24,6,3
3,2020-01/07 01,22,6,3
4,2020-01/09 02,28,6,1
5,2020-01/10 02,26,8,3
6,2020-01/13 02,22,5,1
7,2020-01/14 02,25,5,1
8,2020-01/15 03,28,6,4
9,2020-01/16 03,28,4,2


# New Clients within the report period#
* Clients first appearing in the report interval

In [21]:
collection = {}
collection["name"] = "New Clients"

query = "SELECT firstname, lastname, aliasname, timelinestarttime::date AS startdate FROM guestbook_person \
         WHERE timelinestarttime BETWEEN '{}' AND '{}' \
         ORDER BY timelinestarttime asc".format(trange[0], trange[1])

print(query)

data = pd.read_sql(query, conn)
collection["dataframe"] = data
collection["colwidths"] = [30, 30, 30, 30]
collections.append(collection)

data.head(5000)

SELECT firstname, lastname, aliasname, timelinestarttime::date AS startdate FROM guestbook_person          WHERE timelinestarttime BETWEEN '2020-01-01 00:00:00' AND '2020-03-31 23:59:59.999999'          ORDER BY timelinestarttime asc


Unnamed: 0,firstname,lastname,aliasname,startdate
0,LISA,RUSHING,LRUSHING,2020-01-02
1,LEONARD,NJOROGE,NJOROGE,2020-01-06
2,MARTIN,SMOUTHERSON,MARTIN,2020-01-06
3,MICHELLE,JACKSON,MJACKSON,2020-01-06
4,LEVON,DOZIER,DOZIER,2020-01-06
5,JASON,BARBEE,JASONEB,2020-01-06
6,RONICA,DICKIE,RONICA,2020-01-06
7,LARRY,WADE,LWADE,2020-01-07
8,CLAYTON,RICHA4DS,TOXSIDIOUS3,2020-01-07
9,SHANE,FOSTER,SHANEF,2020-01-07


# Summary Counts #

In [22]:
collection = {}
summ = pd.DataFrame.from_dict(summaries)
collection["name"] = "Summary"
collection["dataframe"] = summ
collection["colwidths"] = [30, 60]
collections.insert(1, collection)
#collections.append(collection)
summ.head(1000)

Unnamed: 0,count,name
0,256,Total distinct clients in report period
1,1275,Meals services delivered.
2,322,Shower services delivered.
3,245,Clothing services delivered.
4,197,Computer services delivered.
5,136,Laundry services delivered.
6,106,Nurse services delivered.
7,100,Pastor Consultation services delivered.
8,259,Days spent in Unstable housing
9,5,Days spent in Jail or priso


In [23]:
_REPORTNAME = _INTERVAL
_SUBJECT = "Opportunity House - Reports for {}".format(toPeriodFriendly(_INTERVAL))
_BODY    = "Spreadsheet (attached) with reports for period {} through {}.".format(trange[0], trange[1])
_EMAIL_RECIPIENT = ['cprice9739@carolina.rr.com', 'pastor@opphouse.net']
#_EMAIL_RECIPIENT = ['cprice9739@carolina.rr.com']

createSpreadsheetAndMailIt(collections, _REPORTNAME, _EMAIL_RECIPIENT, _SUBJECT, _BODY)

Writing dataframe to Excel file PQ-2020-04-03_145911.xlsx
Writing Outline to spreadsheet
colwidths=[30, 100]
Writing Summary to spreadsheet
colwidths=[30, 60]
Writing Distinct Clients to spreadsheet
colwidths=[30, 20]
Writing Services to spreadsheet
colwidths=[30, 20, 20, 20, 20, 20, 20, 20]
Writing Housing to spreadsheet
colwidths=[30, 30, 30, 30, 30, 30]
Writing Unsheltered_by_Name to spreadsheet
colwidths=[30, 30, 30, 30, 30, 30]
Writing Gender to spreadsheet
colwidths=[30, 20, 20, 20]
Writing Ethnicity to spreadsheet
colwidths=[30, 20, 20, 20, 20, 20, 20, 20]
Writing Veterans to spreadsheet
colwidths=[30, 30, 30, 30]
Writing New Clients to spreadsheet
colwidths=[30, 30, 30, 30]
Emailer Done!
Excel/Email Done!
