Census of Drug and Alcohol Treatment Services in Northern Ireland: Breakdown by Service Type

In [1]:
from gssutils import *
# Download the source workbook and open 'Table 2' only when is_interactive() is true.
# NOTE(review): when is_interactive() is false nothing in this cell defines `tab`;
# presumably the calling environment supplies it — confirm.
if is_interactive():
    import requests
    from cachecontrol import CacheControl
    from cachecontrol.caches.file_cache import FileCache
    from cachecontrol.heuristics import LastModified
    from pathlib import Path

    # HTTP session backed by an on-disk cache in '.cache'.
    session = CacheControl(requests.Session(),
                           cache=FileCache('.cache'),
                           heuristic=LastModified())

    # Local folder the downloaded spreadsheet is written to.
    sourceFolder = Path('in')
    sourceFolder.mkdir(exist_ok=True)

    inputURL = 'https://www.health-ni.gov.uk/sites/default/files/publications/dhssps/data-census-drug-alcohol-treatment-services.xlsx'
    inputFile = sourceFolder / 'data-census-drug-alcohol-treatment-services.xlsx'
    response = session.get(inputURL)
    # Fail loudly on an HTTP error instead of saving the error page as an .xlsx file.
    response.raise_for_status()
    with open(inputFile, 'wb') as f:
        f.write(response.content)
    # Keep the first (only requested) tab returned for sheet 'Table 2'.
    tab = loadxlstabs(inputFile, sheetids='Table 2')[0]

Loading in/data-census-drug-alcohol-treatment-services.xlsx which has size 46265 bytes
Table names: ['Table 2']


In [2]:
# Observation cells: the non-blank cells in the region spreading down and right
# from B5, minus everything in the region spreading down and right from B12.
observations = (
    tab.excel_ref('B5').expand(DOWN).expand(RIGHT).is_not_blank()
    - tab.excel_ref('B12').expand(DOWN).expand(RIGHT)
)


In [3]:
# Display the selected observation cells so the selection can be checked by eye.
observations

{<G7 1501.0>, <M7 685.0>, <H8 0.0>, <B6 1069.0>, <I7 153.0>, <J7 172.0>, <D8 167.0>, <H7 360.0>, <C10 38.2>, <D11 16.2>, <F6 2326.0>, <M10 36.6>, <J8 11.0>, <B9 68.2>, <E10 81.8>, <G6 2422.0>, <I6 387.0>, <M9 62.9>, <K11 0.6>, <G10 36.7>, <H6 650.0>, <K8 11.0>, <K5 185.0>, <I10 28.3>, <C8 0.0>, <F9 65.2>, <C5 1496.0>, <F5 3567.0>, <E9 18.2>, <H11 0.0>, <K6 35.0>, <B8 5.0>, <G8 172.0>, <H5 1010.0>, <K9 18.9>, <K7 148.0>, <K10 80.0>, <C6 925.0>, <H9 64.4>, <D6 428.0>, <E7 432.0>, <C11 0.0>, <I5 540.0>, <J6 141.0>, <J5 324.0>, <G5 4095.0>, <H10 35.6>, <C9 61.8>, <F8 172.0>, <F10 30.0>, <I11 0.0>, <I9 71.7>, <B5 1567.0>, <L6 1143.0>, <D10 42.3>, <M6 1178.0>, <D7 437.0>, <F11 4.8>, <L7 537.0>, <M11 0.6>, <L10 31.8>, <G9 59.1>, <J10 53.1>, <I8 0.0>, <C7 571.0>, <E11 0.0>, <L5 1689.0>, <M8 11.0>, <J11 3.4>, <J9 43.5>, <E8 0.0>, <G11 4.2>, <L9 67.7>, <E5 528.0>, <D5 1032.0>, <B7 493.0>, <B10 31.5>, <D9 41.5>, <B11 0.3>, <M5 1874.0>, <E6 96.0>, <F7 1069.0>}

In [4]:
# Row labels: every non-blank cell in column A from A5 downwards.
# This also picks up labels below row 11 (e.g. A13 'Service Type', A15-A21),
# whereas the observation selection stops before row 12.
Service = tab.excel_ref('A5').expand(DOWN).is_not_blank()
# Display the selection for a visual check.
Service

{<A17 'Non-statutory'>, <A6 'Statutory'>, <A19 'Statutory (%)'>, <A11 'Prison (%)'>, <A8 'Prison'>, <A9 'Statutory (%)'>, <A15 'Total'>, <A5 'Total'>, <A21 'Prison (%)'>, <A16 'Statutory'>, <A20 'Non-statutory (%)'>, <A10 'Non-statutory (%)'>, <A13 'Service Type'>, <A7 'Non-statutory'>, <A18 'Prison'>}

In [5]:
# Column headers: every non-blank cell in row 4 from B4 rightwards.
Treatment = tab.excel_ref('B4').expand(RIGHT).is_not_blank()
# Display the selection for a visual check.
Treatment

{<J4 'Drugs & Alcohol'>, <F4 '18 and over'>, <D4 'Drugs & Alcohol'>, <L4 '18 and over'>, <M4 'Total'>, <G4 'Total'>, <C4 'Drugs Only'>, <I4 'Drugs Only'>, <K4 'Under 18s'>, <H4 'Alcohol Only'>, <B4 'Alcohol Only'>, <E4 'Under 18s'>}

In [6]:
# Sex headers: every non-blank cell in row 3 from B3 rightwards
# (the displayed result holds only B3 and H3).
sex = tab.excel_ref('B3').expand(RIGHT).is_not_blank()
# Display the selection for a visual check.
sex

{<H3 'Female  '>, <B3 'Male'>}

In [7]:
# How each observation cell obtains its dimension values: three lookups against
# header cells in the sheet, followed by four constants applied to every row.
# NOTE(review): the constants label every row as Count / People, including the
# rows whose Category ends in '(%)' — confirm whether those need a different
# Measure Type and Unit.
# NOTE(review): Age is fixed to 'All' although 'Under 18s' and '18 and over'
# appear under Treatment Type — confirm this is intended.
Dimensions = [
    HDim(Treatment, 'Treatment Type', DIRECTLY, ABOVE),
    HDim(Service, 'Category', DIRECTLY, LEFT),
    HDim(sex, 'Sex', CLOSEST, LEFT),
] + [
    HDimConst(label, value)
    for label, value in (
        ('Measure Type', 'Count'),
        ('Unit', 'People'),
        ('Period', '2006-2016'),
        ('Age', 'All'),
    )
]

In [8]:
# Bind the observation cells to their dimension definitions; the resulting
# segment is converted to a DataFrame in the next cell.
c1 = ConversionSegment(observations, Dimensions, processTIMEUNIT=True)
# Disabled helper call; presumably renders a preview of the segment — confirm before re-enabling.
# savepreviewhtml(c1)

In [9]:
# Convert the conversion segment into a pandas DataFrame and display it.
new_table = c1.topandas()
new_table




Unnamed: 0,OBS,Treatment Type,Category,Sex,Measure Type,Unit,Period,Age
0,1567.0,Alcohol Only,Total,Male,Count,People,2006-2016,All
1,1496.0,Drugs Only,Total,Male,Count,People,2006-2016,All
2,1032.0,Drugs & Alcohol,Total,Male,Count,People,2006-2016,All
3,528.0,Under 18s,Total,Male,Count,People,2006-2016,All
4,3567.0,18 and over,Total,Male,Count,People,2006-2016,All
5,4095.0,Total,Total,Male,Count,People,2006-2016,All
6,1010.0,Alcohol Only,Total,Female,Count,People,2006-2016,All
7,540.0,Drugs Only,Total,Female,Count,People,2006-2016,All
8,324.0,Drugs & Alcohol,Total,Female,Count,People,2006-2016,All
9,185.0,Under 18s,Total,Female,Count,People,2006-2016,All


In [10]:
# Rename the observation column from 'OBS' to 'Value'; all other columns keep their names.
new_table = new_table.rename(columns={'OBS': 'Value'})

In [11]:
# Inspect the dtype of each column.
new_table.dtypes

Value             float64
Treatment Type     object
Category           object
Sex                object
Measure Type       object
Unit               object
Period             object
Age                object
dtype: object

In [12]:
# Show the last five rows of the table.
new_table.tail(5)

Unnamed: 0,Value,Treatment Type,Category,Sex,Measure Type,Unit,Period,Age
77,0.0,Alcohol Only,Prison (%),Female,Count,People,2006-2016,All
78,0.0,Drugs Only,Prison (%),Female,Count,People,2006-2016,All
79,3.4,Drugs & Alcohol,Prison (%),Female,Count,People,2006-2016,All
80,0.6,Under 18s,Prison (%),Female,Count,People,2006-2016,All
81,0.6,Total,Prison (%),Female,Count,People,2006-2016,All


In [13]:
# Count the non-null entries in each column.
new_table.count()

Value             82
Treatment Type    82
Category          82
Sex               82
Measure Type      82
Unit              82
Period            82
Age               82
dtype: int64

In [14]:
# Keep only the rows whose Value is not zero.
# NOTE(review): this removes zero-valued observations as well (the row count
# falls from 82 to 74) — confirm that dropping them is intended.
new_table = new_table.loc[new_table['Value'].ne(0)]

In [15]:
# Count the non-null entries in each column again, now that zero-valued rows are gone.
new_table.count()

Value             74
Treatment Type    74
Category          74
Sex               74
Measure Type      74
Unit              74
Period            74
Age               74
dtype: int64

In [16]:
# Put the columns into their final output order.
new_table = new_table.loc[:, [
    'Period',
    'Category',
    'Age',
    'Sex',
    'Treatment Type',
    'Measure Type',
    'Value',
    'Unit',
]]

In [17]:
# Preview the first five rows of the reordered table.
new_table.head(5)

Unnamed: 0,Period,Category,Age,Sex,Treatment Type,Measure Type,Value,Unit
0,2006-2016,Total,All,Male,Alcohol Only,Count,1567.0,People
1,2006-2016,Total,All,Male,Drugs Only,Count,1496.0,People
2,2006-2016,Total,All,Male,Drugs & Alcohol,Count,1032.0,People
3,2006-2016,Total,All,Male,Under 18s,Count,528.0,People
4,2006-2016,Total,All,Male,18 and over,Count,3567.0,People
