Table 4.6.1: Religion, new presentations to treatment

In [1]:
from gssutils import *

if is_interactive():
    # Point the scraper at the gov.uk collection page for these statistics.
    scraper = Scraper(
        'https://www.gov.uk/government/collections/alcohol-and-drug-misuse-and-treatment-statistics'
    )
    # Narrow to the most recent dataset whose title has the expected prefix.
    scraper.select_dataset(
        title=lambda title: title.startswith('Substance misuse treatment for adults'),
        latest=True,
    )
    # Index every databaker tab of the 'Data tables' distribution by its name.
    tabs = {
        sheet.name: sheet
        for sheet in scraper.distribution(
            title=lambda title: title.startswith('Data tables')
        ).as_databaker()
    }

In [2]:
# Pick the worksheet for Table 4.6.1 out of the name-keyed `tabs` mapping.
# NOTE(review): this notebook only builds `tabs` when is_interactive() is true;
# otherwise it presumably has to be supplied by whatever runs this notebook -- confirm.
tab = tabs['Table 4.6.1']

https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/752515/AdultSubstanceMisuseNDTMSDataTables2017-18.xlsx

In [3]:
def _with_content(bag):
    """Keep only the cells of `bag` that are neither blank nor whitespace-only."""
    return bag.is_not_blank().is_not_whitespace()


# The single 'Religion' header cell anchors the row and column label selections.
cell = tab.filter('Religion')
cell.assert_one()

# Cells reached by shifting 'Inconsistent/missing' by (0, 1) and expanding to the
# right; these are removed from the observation selection below.
obs = tab.filter('Inconsistent/missing').shift(0, 1).expand(RIGHT)

# Observations: non-empty cells beneath every 'n' header, minus the excluded cells.
observations = _with_content(tab.filter('n').fill(DOWN)) - obs

# Labels running down from, and across from, the anchor cell (anchor included).
Religion = _with_content(cell.expand(DOWN))
Clients = _with_content(cell.expand(RIGHT))

Dimensions = [
    HDim(Religion, 'Treatment group', DIRECTLY, LEFT),
    HDim(Clients, 'Clients in treatment', CLOSEST, LEFT),
    HDimConst('Measure Type', 'count-of-new-presentations-to-treatment'),
    HDimConst('Unit', 'new-presentations-to-treatment'),
    HDimConst('Period', 'gregorian-interval/2017-04-01T00:00:00/P1Y'),
]

In [4]:
# Pair the selected observation cells with the dimension definitions.
c1 = ConversionSegment(
    observations,
    Dimensions,
    processTIMEUNIT=True,
)

# When running interactively, render a preview of the segment for visual checking.
if is_interactive():
    savepreviewhtml(c1)

0,1,2
OBS,Treatment group,Clients in treatment

0,1,2,3,4,5,6,7,8,9,10
"Table 4.6.1: Religion, new presentations to treatment",,,,,,,,,,
Link back to the index,,,,,,,,,,
Religion,Opiate,,Non-opiate only,,Non-opiate and Alcohol,,Alcohol only,,Total,
,n,%,n,%,n,%,n,%,n,%
Baha'i,8.0,0.000199024778584934,2.0,0.000129265770423992,1.0,5.67891419160657e-05,5.0,0.000101549647622723,16.0,0.000130597319490017
Buddhist,243.0,0.00604537764951736,50.0,0.00323164426059979,78.0,0.00442955306945312,169.0,0.00343237808964803,540.0,0.00440765953278809
Christian,9522.0,0.236889242710717,3126.0,0.202042399172699,3958.0,0.224771423703788,14943.0,0.303491276885269,31549.0,0.25751342703691
Hindu,138.0,0.00343317743059011,40.0,0.00258531540847983,59.0,0.00335055937304787,329.0,0.00668196681357516,566.0,0.00461988017695937
Jain,5.0,0.000124390486615584,1.0,6.46328852119959e-05,2.0,0.000113578283832131,6.0,0.000121859577147267,14.0,0.000114272654553765
Jewish,49.0,0.00121902676883272,31.0,0.00200361944157187,23.0,0.00130615026406951,45.0,0.000913946828604505,148.0,0.00120802520528266


In [5]:
# Convert the conversion segment into a DataFrame; the later cells clean it up
# and recode its columns with pandas operations.
new_table = c1.topandas()




In [6]:
import numpy as np
# Tidy the observation column:
#   1. treat empty-string observations as missing and drop those rows,
#   2. rename 'OBS' to 'Value',
#   3. cast the counts to integers.
#
# The blank-to-NaN step is done by assigning a new column rather than calling
# `replace(..., inplace=True)` on the `new_table['OBS']` selection: an in-place
# call on a selected column acts on an intermediate object and is not guaranteed
# to write back to the frame (it never does under pandas Copy-on-Write).
#
# A single integer cast is enough. The earlier second pass that mapped '-' to ''
# ran after the cast, so its '-' branch could never be taken; a '-' in the data
# still surfaces as an error from the cast, as before.
new_table = (
    new_table
    .assign(OBS=lambda frame: frame['OBS'].replace('', np.nan))
    .dropna(subset=['OBS'])
    .rename(columns={'OBS': 'Value'})
    .astype({'Value': int})
)

In [7]:
# Lookup from the religion labels used in the sheet to their codelist paths.
# Built once here rather than inside the lambda, where it was re-created for
# every row being mapped.
religion_codes = {
    'Religion':'religion',
    "Baha'i":"religion/bahai",
    'Buddhist':'religion/buddhist',
    'Christian':'religion/christian',
    'Hindu':'religion/hindu',
    'Jain':'religion/jain',
    'Jewish':'religion/jewish',
    'Muslim':'religion/muslim',
    'Pagan':'religion/pagan',
    'Sikh':'religion/sikh',
    'Zoroastrian':'religion/zoroastrian',
    'Other':'religion/other',
    'None':'religion/none',
    'Decline':'religion/decline',
    'Unknown':'religion/unknown',
    'Inconsistent/missing':'religion/inconsistent/missing',
    'Total':'religion/total',
}

# Recode 'Treatment group' into 'Basis of treatment'; a label that is not in the
# lookup is passed through unchanged.
new_table['Basis of treatment'] = new_table['Treatment group'].map(
    lambda label: religion_codes.get(label, label))

In [8]:
import urllib.request as request
import csv
import io
import requests
# Download the substance-type codelist and use it to turn the 'Clients in treatment'
# labels into codelist notations.
vrl="https://raw.githubusercontent.com/ONS-OpenData/ref_alcohol/master/codelists/substance-type.csv"
# A timeout stops the cell hanging indefinitely on an unresponsive server.
response = requests.get(vrl, timeout=30)
# Fail here on an HTTP error instead of parsing an error page as if it were the CSV.
response.raise_for_status()
t=response.content
g=pd.read_csv(io.StringIO(t.decode('utf-8')))

# Left join on the human-readable label: every observation row is kept, and rows whose
# label has no match in the codelist end up with a null 'Substance type'.
new_table = pd.merge(new_table, g, how = 'left', left_on = 'Clients in treatment', right_on = 'Label')
# The codelist's 'Notation' column is the substance-type code.
new_table = new_table.rename(columns={'Notation': 'Substance type'})
# Keep only the output columns, in their final order.
new_table = new_table[['Period','Basis of treatment','Substance type','Measure Type','Value','Unit']]

In [9]:
# Show the finished table as the cell's output for a visual check.
new_table

Unnamed: 0,Period,Basis of treatment,Substance type,Measure Type,Value,Unit
0,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/bahai,opiate,Count,8,clients-in-treatment
1,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/bahai,non-opiate-only,Count,2,clients-in-treatment
2,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/bahai,non-opiate-and-alcohol,Count,1,clients-in-treatment
3,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/bahai,alcohol-only,Count,5,clients-in-treatment
4,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/bahai,total,Count,16,clients-in-treatment
5,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/buddhist,opiate,Count,243,clients-in-treatment
6,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/buddhist,non-opiate-only,Count,50,clients-in-treatment
7,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/buddhist,non-opiate-and-alcohol,Count,78,clients-in-treatment
8,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/buddhist,alcohol-only,Count,169,clients-in-treatment
9,gregorian-interval/2017-04-01T00:00:00/P1Y,religion/buddhist,total,Count,540,clients-in-treatment
