# Debates in the Oireachtas: 02 - Dataframes


In [3]:
import os
import sys
import uuid
import json
import lzma
import requests
from glob import glob
from datetime import datetime
from multiprocessing import Pool
import pandas as pd
from pandas.io.json import json_normalize

#import tqdm
from tqdm import tqdm_notebook

# Max results available for paging through with limit & skip is 10,000 so splitting by years works best
def save_page_year(page, year, overwrite=False):
    fname = "../data/{}/{}.json.xz".format(page,year)
    url = "https://api.oireachtas.ie/v1/{}?date_start={}&date_end={}&limit=10000".format(page, year, year+1)
    cache_url(url, fname)

# Save a given url as a file
def cache_url(url, fname, overwrite=False):
    if os.path.isfile(fname) and not overwrite:
        return

    data = requests.get(url).content
    with lzma.open(fname, 'wb') as f:            
        f.write(data)

# Show Progress bar and perform a function on an iterable in parallel:
def process_with_progress(func, iterable):
    with Pool(8) as p:
        results = list(tqdm_notebook(p.imap(func, iterable), total=len(iterable)))
    return results

# Preprocess:

# Flatten json / dict values in a column
def flatten_column(df, column):
    tmp_df = json_normalize([r for r in df[column]])
    tmp_df.rename(columns=lambda k: column+'.'+k, inplace=True)
    tmp_df.index = df.index
    return tmp_df

def flatten_dataframe_columns(df, columns):
    df_expanded = pd.concat([flatten_column(df, column) for column in columns], axis=1)
    df.drop(columns, axis=1, inplace=True) # remove flattened originally json columns
    df = pd.concat([df_expanded, df], axis=1)
    return df

In [4]:
def save_debates_page(year, overwrite=False):
    save_page_year('debates', year, overwrite)
    
    
# Entire dataset: 19349 as of 15-12-2017, starts at 1919
years = range(1919, datetime.now().year + 1)
print("Debates Pages:")
process_with_progress(save_debates_page, years)

# Update this year
save_debates_page(datetime.now().year, True)

Debates Pages:


HBox(children=(IntProgress(value=0, max=101), HTML(value='')))




In [5]:
with lzma.open('../data/debates/2019.json.xz', 'rb') as f:
    preview = json.loads(f.read().decode('utf-8'))

JSONDecodeError: Expecting value: line 1 column 3433913 (char 3433912)

In [7]:
RenderJSON(preview)

In [None]:
#preview

In [9]:
# Load Data from a single file and return dataframe
def debates_df(fname):
    with lzma.open(fname, 'rb') as f:
        data = json.loads(f.read().decode('utf-8'))
        #print(fname, len(data['results']))
        
        # We don't care about the "head" part for now, just "results"
        records = json.dumps([r['debateRecord'] for r in data['results']])
        df = pd.read_json(records, orient='records', dtype=False)
        return df

In [14]:
debates_df("data/year/2007.json.xz")

Unnamed: 0,date,debateSections,lastUpdated,debateType,formats,chamber,counts,uri,house
0,2007-12-20,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T19:42:28+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...","{'showAs': 'Seanad Éireann', 'uri': '/ie/oirea...","{'questionCount': 0, 'billCount': 5, 'contribu...",/akn/ie/debateRecord/seanad/2007-12-20/debate/...,"{'showAs': '23rd Seanad', 'committeeCode': '',..."
1,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T19:28:12+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...","{'showAs': 'Dáil Éireann', 'uri': '/ie/oireach...","{'questionCount': 380, 'billCount': 1, 'contri...",/akn/ie/debateRecord/dail/2007-12-19/debate/main,"{'showAs': '30th Dáil', 'committeeCode': '', '..."
2,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:29:06+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...","{'showAs': 'JOINT COMMITTEE ON ENTERPRISE, TRA...","{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_enterp...,"{'showAs': 'JOINT COMMITTEE ON ENTERPRISE, TRA..."
3,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:32:56+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...","{'showAs': 'SELECT COMMITTEE ON ENTERPRISE, TR...","{'questionCount': 0, 'billCount': 1, 'contribu...",/akn/ie/debateRecord/select_committee_on_enter...,"{'showAs': 'SELECT COMMITTEE ON ENTERPRISE, TR..."
4,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:30:42+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...",{'showAs': 'JOINT COMMITTEE ON FOREIGN AFFAIRS...,"{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_foreig...,{'showAs': 'JOINT COMMITTEE ON FOREIGN AFFAIRS...
5,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:28:22+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...",{'showAs': 'JOINT COMMITTEE ON CLIMATE CHANGE ...,"{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_climat...,{'showAs': 'JOINT COMMITTEE ON CLIMATE CHANGE ...
6,2007-12-19,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T19:42:28+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...","{'showAs': 'Seanad Éireann', 'uri': '/ie/oirea...","{'questionCount': 0, 'billCount': 3, 'contribu...",/akn/ie/debateRecord/seanad/2007-12-19/debate/...,"{'showAs': '23rd Seanad', 'committeeCode': '',..."
7,2007-12-18,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:31:58+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...",{'showAs': 'JOINT COMMITTEE ON THE ENVIRONMENT...,"{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_the_en...,{'showAs': 'JOINT COMMITTEE ON THE ENVIRONMENT...
8,2007-12-18,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:31:04+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...",{'showAs': 'JOINT COMMITTEE ON HEALTH AND CHIL...,"{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_health...,{'showAs': 'JOINT COMMITTEE ON HEALTH AND CHIL...
9,2007-12-18,"[{'debateSection': {'debateType': 'prelude', '...",2017-03-24T18:30:02+00:00,debate,"{'pdf': None, 'xml': {'uri': '/akn/ie/debateRe...",{'showAs': 'JOINT COMMITTEE ON EUROPEAN SCRUTI...,"{'questionCount': 0, 'billCount': 0, 'contribu...",/akn/ie/debateRecord/joint_committee_on_europe...,{'showAs': 'JOINT COMMITTEE ON EUROPEAN SCRUTI...


In [21]:
# Process all the files and stick them together in a single dataframe:
files = glob('data/year/*.json.xz')

data_frames = process_with_progress(debates_df, files)
df_raw = pd.concat(data_frames, axis=0, sort=True)

HBox(children=(IntProgress(value=0, max=95), HTML(value='')))

of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.


  """


In [25]:
flatten_columns = ['formats','chamber','counts', 'house'] # deal with debateSections later
df_raw = flatten_dataframe_columns(df_raw, flatten_columns)

In [26]:
df_raw.sample(5)

Unnamed: 0,formats.pdf,formats.xml.uri,formats.pdf.uri,chamber.showAs,chamber.uri,counts.questionCount,counts.billCount,counts.divisionCount,counts.contributorCount,counts.debateSectionCount,house.showAs,house.chamberType,house.committeeCode,house.houseCode,house.houseNo,house.uri,date,debateSections,debateType,lastUpdated,uri
286,,/akn/ie/debateRecord/joint_committee_on_social...,,JOINT COMMITTEE ON SOCIAL AND FAMILY AFFAIRS,/ie/oireachtas/committee,0,0,0,15,2,JOINT COMMITTEE ON SOCIAL AND FAMILY AFFAIRS,committee,joint_committee_on_social_and_family_affairs,dail,30,/ie/oireachtas/committee/dail/30/joint_committ...,2009-06-24,"[{'debateSection': {'debateType': 'prelude', '...",debate,2017-03-24T18:31:50+00:00,/akn/ie/debateRecord/joint_committee_on_social...
68,,/akn/ie/debateRecord/seanad/1929-05-15/debate/...,,Seanad Éireann,/ie/oireachtas/house/seanad,0,1,2,25,5,1928 Seanad,house,,seanad,1928,/ie/oireachtas/house/seanad/1928,1929-05-15,"[{'debateSection': {'debateType': 'prelude', '...",debate,2017-03-24T19:33:10+00:00,/akn/ie/debateRecord/seanad/1929-05-15/debate/...
62,,/akn/ie/debateRecord/seanad/1941-05-08/debate/...,,Seanad Éireann,/ie/oireachtas/house/seanad,0,0,0,4,4,3rd Seanad,house,,seanad,3,/ie/oireachtas/house/seanad/3,1941-05-08,"[{'debateSection': {'debateType': 'prelude', '...",debate,2017-03-24T19:34:04+00:00,/akn/ie/debateRecord/seanad/1941-05-08/debate/...
329,,/akn/ie/debateRecord/standing_order_112_select...,/ie/oireachtas/debateRecord/standing_order_112...,Standing Order 112 Select Committee,/ie/oireachtas/committee,0,0,0,3,1,Standing Order 112 Select Committee,committee,standing_order_112_select_committee,dail,32,/ie/oireachtas/committee/dail/32/standing_orde...,2016-06-08,"[{'debateSection': {'debateType': 'debate', 'f...",debate,2017-10-02T10:20:37+01:00,/akn/ie/debateRecord/standing_order_112_select...
62,,/akn/ie/debateRecord/dail/1963-05-30/debate/mu...,,Dáil Éireann,/ie/oireachtas/house/dail,0,1,0,31,35,17th Dáil,house,,dail,17,/ie/oireachtas/house/dail/17,1963-05-30,"[{'debateSection': {'debateType': 'prelude', '...",debate,2017-03-24T19:11:58+00:00,/akn/ie/debateRecord/dail/1963-05-30/debate/main


In [27]:
df_raw.drop(['debateSections','formats.pdf'], axis=1, inplace=True)

In [28]:
describe_with_top_n(df_raw, n=50)

----------

# formats.xml.uri

###  Stats:

Unnamed: 0,formats.xml.uri
count,16560
unique,16559
top,/akn/ie/debateRecord/seanad/1936-01-01/debate/...
freq,2
missing,0


###  Top N:

Unnamed: 0,formats.xml.uri
/akn/ie/debateRecord/seanad/1936-01-01/debate/mul@/main.xml,2
/akn/ie/debateRecord/joint_committee_on_european_affairs/2006-12-14/debate/mul@/main.xml,1
/akn/ie/debateRecord/joint_committee_on_enterprise_and_small_business/2005-10-05/debate/mul@/main.xml,1
/akn/ie/debateRecord/dail/2003-11-19/debate/mul@/main.xml,1
/akn/ie/debateRecord/dail/1986-11-27/debate/mul@/main.xml,1
/akn/ie/debateRecord/select_committee_on_legislation_and_security/1996-12-10/debate/mul@/main.xml,1
/akn/ie/debateRecord/dail/1981-03-04/debate/mul@/main.xml,1
/akn/ie/debateRecord/joint_committee_on_foreign_affairs/2004-11-09/debate/mul@/main.xml,1
/akn/ie/debateRecord/dail/1974-07-03/debate/mul@/main.xml,1
/akn/ie/debateRecord/dail/1929-04-10/debate/mul@/main.xml,1


----------

# formats.pdf.uri

###  Stats:

Unnamed: 0,formats.pdf.uri
count,609
unique,609
top,/ie/oireachtas/debateRecord/dail/2016-04-28/de...
freq,1
missing,15951


###  Top N:

Unnamed: 0,formats.pdf.uri
/ie/oireachtas/debateRecord/dail/2016-04-28/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/joint_committee_on_health_and_children/2012-12-06/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/dail/2016-01-19/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/seanad/2016-06-15/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/joint_committee_on_finance_public_expenditure_and_reform/2012-11-22/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/dail/2016-05-31/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/joint_committee_on_agriculture_food_and_the_marine/2016-09-27/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/committee_of_public_accounts/2012-10-04/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/joint_committee_on_justice_and_equality/2016-10-05/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/dail/2016-10-12/debate/mul@/main.pdf,1


----------

# chamber.showAs

###  Stats:

Unnamed: 0,chamber.showAs
count,16560
unique,251
top,Dáil Éireann
freq,7419
missing,0


###  Top N:

Unnamed: 0,chamber.showAs
Dáil Éireann,7419
Seanad Éireann,3927
JOINT COMMITTEE ON EUROPEAN AFFAIRS,233
COMMITTEE OF PUBLIC ACCOUNTS,195
JOINT COMMITTEE ON HEALTH AND CHILDREN,187
JOINT COMMITTEE ON TRANSPORT,155
JOINT COMMITTEE ON FOREIGN AFFAIRS,144
JOINT COMMITTEE ON FINANCE AND THE PUBLIC SERVICE,134
SELECT COMMITTEE ON FINANCE AND THE PUBLIC SERVICE,132
JOINT COMMITTEE ON EDUCATION AND SCIENCE,131


----------

# chamber.uri

###  Stats:

Unnamed: 0,chamber.uri
count,16560
unique,3
top,/ie/oireachtas/house/dail
freq,7419
missing,0


###  Top N:

Unnamed: 0,chamber.uri
/ie/oireachtas/house/dail,7419
/ie/oireachtas/committee,5214
/ie/oireachtas/house/seanad,3927


----------

# counts.questionCount

###  Stats:

Unnamed: 0,counts.questionCount
count,16560.0
mean,29.988043
std,108.893893
min,0.0
25%,0.0
50%,0.0
75%,0.0
max,1949.0
missing,14653.0


###  Top N:

Unnamed: 0,counts.questionCount
0,14653
123,15
164,14
201,14
284,13
184,13
175,13
157,13
204,11
188,11


----------

# counts.billCount

###  Stats:

Unnamed: 0,counts.billCount
count,16560.0
mean,1.981341
std,2.607334
min,0.0
25%,0.0
50%,1.0
75%,3.0
max,74.0
missing,6199.0


###  Top N:

Unnamed: 0,counts.billCount
0,6199
1,3010
2,2195
3,1715
4,1150
5,860
6,571
7,310
8,199
9,113


----------

# counts.divisionCount

###  Stats:

Unnamed: 0,counts.divisionCount
count,16560.0
mean,0.656159
std,1.423538
min,0.0
25%,0.0
50%,0.0
75%,1.0
max,41.0
missing,11413.0


###  Top N:

Unnamed: 0,counts.divisionCount
0,11413
1,2559
2,1273
3,614
4,303
5,160
6,104
7,46
8,33
9,18


----------

# counts.contributorCount

###  Stats:

Unnamed: 0,counts.contributorCount
count,16560.0
mean,37.228684
std,33.220478
min,0.0
25%,13.0
50%,26.0
75%,50.0
max,166.0
missing,25.0


###  Top N:

Unnamed: 0,counts.contributorCount
11,637
10,590
9,571
13,550
12,548
8,467
14,435
7,429
15,396
16,339


----------

# counts.debateSectionCount

###  Stats:

Unnamed: 0,counts.debateSectionCount
count,16560.0
mean,38.70628
std,76.610986
min,1.0
25%,3.0
50%,9.0
75%,40.0
max,1166.0
missing,0.0


###  Top N:

Unnamed: 0,counts.debateSectionCount
2,2111
3,1915
4,1073
5,745
6,682
7,652
8,603
9,531
10,429
11,337


----------

# house.showAs

###  Stats:

Unnamed: 0,house.showAs
count,16560
unique,310
top,27th Dáil
freq,435
missing,0


###  Top N:

Unnamed: 0,house.showAs
27th Dáil,435
28th Dáil,422
29th Dáil,411
20th Dáil,404
24th Dáil,391
8th Dáil,375
22nd Seanad,374
21st Seanad,352
4th Dáil,351
18th Dáil,346


----------

# house.chamberType

###  Stats:

Unnamed: 0,house.chamberType
count,16560
unique,2
top,house
freq,11346
missing,0


###  Top N:

Unnamed: 0,house.chamberType
house,11346
committee,5214


----------

# house.committeeCode

###  Stats:

Unnamed: 0,house.committeeCode
count,16560.0
unique,208.0
top,
freq,11346.0
missing,11346.0


###  Top N:

Unnamed: 0,house.committeeCode
,11346
joint_committee_on_european_affairs,325
committee_of_public_accounts,288
joint_committee_on_health_and_children,249
joint_committee_on_foreign_affairs,223
joint_committee_on_transport,155
joint_committee_on_finance_and_the_public_service,134
select_committee_on_finance_and_the_public_service,132
joint_committee_on_education_and_science,131
joint_committee_on_enterprise_and_small_business,121


----------

# house.houseCode

###  Stats:

Unnamed: 0,house.houseCode
count,16560
unique,2
top,dail
freq,12633
missing,0


###  Top N:

Unnamed: 0,house.houseCode
dail,12633
seanad,3927


----------

# house.houseNo

###  Stats:

Unnamed: 0,house.houseNo
count,16560
unique,37
top,29
freq,2217
missing,0


###  Top N:

Unnamed: 0,house.houseNo
29,2217
30,1705
28,902
31,856
20,772
27,744
21,708
24,586
19,522
17,498


----------

# house.uri

###  Stats:

Unnamed: 0,house.uri
count,16560
unique,318
top,/ie/oireachtas/house/dail/27
freq,435
missing,0


###  Top N:

Unnamed: 0,house.uri
/ie/oireachtas/house/dail/27,435
/ie/oireachtas/house/dail/28,422
/ie/oireachtas/house/dail/29,411
/ie/oireachtas/house/dail/20,404
/ie/oireachtas/house/dail/24,391
/ie/oireachtas/house/dail/8,375
/ie/oireachtas/house/seanad/22,374
/ie/oireachtas/house/seanad/21,352
/ie/oireachtas/house/dail/4,351
/ie/oireachtas/house/dail/18,346


----------

# date

###  Stats:

Unnamed: 0,date
count,16560
unique,8740
top,2010-12-01 00:00:00
freq,13
first,1919-01-22 00:00:00
last,2016-12-21 00:00:00
missing,0


###  Top N:

Unnamed: 0,date
2010-12-01,13
2008-02-20,12
2010-06-02,12
2009-12-02,11
2003-06-19,11
2008-03-05,11
2005-03-02,10
2008-12-10,10
2016-11-30,10
2016-11-22,10


----------

# debateType

###  Stats:

Unnamed: 0,debateType
count,16560
unique,1
top,debate
freq,16560
missing,0


###  Top N:

Unnamed: 0,debateType
debate,16560


----------

# lastUpdated

###  Stats:

Unnamed: 0,lastUpdated
count,16560
unique,1746
top,2017-03-24T18:28:50+00:00
freq,27
missing,0


###  Top N:

Unnamed: 0,lastUpdated
2017-03-24T18:28:50+00:00,27
2017-03-24T18:29:24+00:00,26
2017-03-24T18:30:06+00:00,26
2017-03-24T18:30:04+00:00,26
2017-03-24T18:31:56+00:00,25
2017-03-24T18:30:44+00:00,25
2017-03-24T18:29:48+00:00,25
2017-03-24T18:29:44+00:00,25
2017-03-24T18:35:22+00:00,25
2017-03-24T18:29:36+00:00,25


----------

# uri

###  Stats:

Unnamed: 0,uri
count,16560
unique,16559
top,/akn/ie/debateRecord/seanad/1936-01-01/debate/...
freq,2
missing,0


###  Top N:

Unnamed: 0,uri
/akn/ie/debateRecord/seanad/1936-01-01/debate/main,2
/akn/ie/debateRecord/dail/1952-11-12/debate/main,1
/akn/ie/debateRecord/dail/1971-02-17/debate/main,1
/akn/ie/debateRecord/joint_committee_on_arts_sport_tourism_community_rural_and_gaeltacht_affairs/2008-10-08/debate/main,1
/akn/ie/debateRecord/seanad/1993-04-08/debate/main,1
/akn/ie/debateRecord/dail/2008-10-29/debate/main,1
/akn/ie/debateRecord/joint_committee_on_justice_equality_defence_and_womens_rights/2009-01-27/debate/main,1
/akn/ie/debateRecord/select_committee_on_justice_equality_defence_and_womens_rights/2005-05-03/debate/main,1
/akn/ie/debateRecord/joint_committee_on_education_and_science/2009-12-02/debate/main,1
/akn/ie/debateRecord/joint_committee_on_european_union_affairs/2012-06-27/debate/main,1


In [29]:
df_raw.to_pickle('debates.p.xz', compression='xz') # gzip is faster, but xz makes much smaller files for git

In [30]:
import pandas_profiling

In [31]:
pandas_profiling.ProfileReport(df_raw)


To register the converters:
	>>> from pandas.plotting import register_matplotlib_converters
	>>> register_matplotlib_converters()
  variable_stats = pd.concat(ldesc, join_axes=pd.Index([names]), axis=1)


0,1
Number of variables,20
Number of observations,16560
Total Missing (%),4.8%
Total size in memory,2.5 MiB
Average record size in memory,160.0 B

0,1
Numeric,6
Categorical,12
Boolean,0
Date,1
Text (Unique),0
Rejected,1
Unsupported,0

0,1
Distinct count,660
Unique (%),4.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,148
Minimum,0
Maximum,659
Zeros (%),0.6%

0,1
Minimum,0
5-th percentile,8
Q1,44
Median,92
Q3,199
95-th percentile,494
Maximum,659
Range,659
Interquartile range,155

0,1
Standard deviation,148.42
Coef of variation,1.0028
Kurtosis,1.2412
Mean,148
MAD,114.67
Skewness,1.4437
Sum,2450937
Variance,22028
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
0,95,0.6%,
2,95,0.6%,
1,95,0.6%,
3,94,0.6%,
11,94,0.6%,
10,94,0.6%,
12,94,0.6%,
9,94,0.6%,
8,94,0.6%,
7,94,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,95,0.6%,
1,95,0.6%,
2,95,0.6%,
3,94,0.6%,
4,94,0.6%,

Value,Count,Frequency (%),Unnamed: 3
655,1,0.0%,
656,1,0.0%,
657,1,0.0%,
658,1,0.0%,
659,1,0.0%,

0,1
Distinct count,16559
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0

0,1
/akn/ie/debateRecord/seanad/1936-01-01/debate/mul@/main.xml,2
/akn/ie/debateRecord/joint_committee_on_european_affairs/2006-12-14/debate/mul@/main.xml,1
/akn/ie/debateRecord/joint_committee_on_enterprise_and_small_business/2005-10-05/debate/mul@/main.xml,1
Other values (16556),16556

Value,Count,Frequency (%),Unnamed: 3
/akn/ie/debateRecord/seanad/1936-01-01/debate/mul@/main.xml,2,0.0%,
/akn/ie/debateRecord/joint_committee_on_european_affairs/2006-12-14/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_enterprise_and_small_business/2005-10-05/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/dail/2003-11-19/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/dail/1986-11-27/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/select_committee_on_legislation_and_security/1996-12-10/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/dail/1981-03-04/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_foreign_affairs/2004-11-09/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/dail/1974-07-03/debate/mul@/main.xml,1,0.0%,
/akn/ie/debateRecord/dail/1929-04-10/debate/mul@/main.xml,1,0.0%,

0,1
Distinct count,610
Unique (%),3.7%
Missing (%),96.3%
Missing (n),15951

0,1
/ie/oireachtas/debateRecord/joint_committee_on_health_and_children/2012-12-06/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/dail/2016-01-19/debate/mul@/main.pdf,1
/ie/oireachtas/debateRecord/seanad/2016-06-15/debate/mul@/main.pdf,1
Other values (606),606
(Missing),15951

Value,Count,Frequency (%),Unnamed: 3
/ie/oireachtas/debateRecord/joint_committee_on_health_and_children/2012-12-06/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/dail/2016-01-19/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/seanad/2016-06-15/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/joint_committee_on_finance_public_expenditure_and_reform/2012-11-22/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/dail/2016-05-31/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/joint_committee_on_agriculture_food_and_the_marine/2016-09-27/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/committee_of_public_accounts/2012-10-04/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/joint_committee_on_justice_and_equality/2016-10-05/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/dail/2016-10-12/debate/mul@/main.pdf,1,0.0%,
/ie/oireachtas/debateRecord/dail/2016-04-14/debate/mul@/main.pdf,1,0.0%,

0,1
Distinct count,251
Unique (%),1.5%
Missing (%),0.0%
Missing (n),0

0,1
Dáil Éireann,7419
Seanad Éireann,3927
JOINT COMMITTEE ON EUROPEAN AFFAIRS,233
Other values (248),4981

Value,Count,Frequency (%),Unnamed: 3
Dáil Éireann,7419,44.8%,
Seanad Éireann,3927,23.7%,
JOINT COMMITTEE ON EUROPEAN AFFAIRS,233,1.4%,
COMMITTEE OF PUBLIC ACCOUNTS,195,1.2%,
JOINT COMMITTEE ON HEALTH AND CHILDREN,187,1.1%,
JOINT COMMITTEE ON TRANSPORT,155,0.9%,
JOINT COMMITTEE ON FOREIGN AFFAIRS,144,0.9%,
JOINT COMMITTEE ON FINANCE AND THE PUBLIC SERVICE,134,0.8%,
SELECT COMMITTEE ON FINANCE AND THE PUBLIC SERVICE,132,0.8%,
JOINT COMMITTEE ON EDUCATION AND SCIENCE,131,0.8%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
/ie/oireachtas/house/dail,7419
/ie/oireachtas/committee,5214
/ie/oireachtas/house/seanad,3927

Value,Count,Frequency (%),Unnamed: 3
/ie/oireachtas/house/dail,7419,44.8%,
/ie/oireachtas/committee,5214,31.5%,
/ie/oireachtas/house/seanad,3927,23.7%,

0,1
Distinct count,594
Unique (%),3.6%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,29.988
Minimum,0
Maximum,1949
Zeros (%),88.5%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,228
Maximum,1949
Range,1949
Interquartile range,0

0,1
Standard deviation,108.89
Coef of variation,3.6312
Kurtosis,48.186
Mean,29.988
MAD,53.185
Skewness,5.7489
Sum,496602
Variance,11858
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
0,14653,88.5%,
123,15,0.1%,
164,14,0.1%,
201,14,0.1%,
284,13,0.1%,
184,13,0.1%,
175,13,0.1%,
157,13,0.1%,
204,11,0.1%,
188,11,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,14653,88.5%,
2,1,0.0%,
7,2,0.0%,
8,1,0.0%,
9,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1548,1,0.0%,
1640,1,0.0%,
1683,1,0.0%,
1770,1,0.0%,
1949,1,0.0%,

0,1
Distinct count,30
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.9813
Minimum,0
Maximum,74
Zeros (%),37.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,1
Q3,3
95-th percentile,7
Maximum,74
Range,74
Interquartile range,3

0,1
Standard deviation,2.6073
Coef of variation,1.3159
Kurtosis,66.233
Mean,1.9813
MAD,1.8401
Skewness,4.3084
Sum,32811
Variance,6.7982
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
0,6199,37.4%,
1,3010,18.2%,
2,2195,13.3%,
3,1715,10.4%,
4,1150,6.9%,
5,860,5.2%,
6,571,3.4%,
7,310,1.9%,
8,199,1.2%,
9,113,0.7%,

Value,Count,Frequency (%),Unnamed: 3
0,6199,37.4%,
1,3010,18.2%,
2,2195,13.3%,
3,1715,10.4%,
4,1150,6.9%,

Value,Count,Frequency (%),Unnamed: 3
29,1,0.0%,
36,1,0.0%,
50,1,0.0%,
61,1,0.0%,
74,1,0.0%,

0,1
Distinct count,22
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.65616
Minimum,0
Maximum,41
Zeros (%),68.9%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,1
95-th percentile,3
Maximum,41
Range,41
Interquartile range,1

0,1
Standard deviation,1.4235
Coef of variation,2.1695
Kurtosis,73.022
Mean,0.65616
MAD,0.90444
Skewness,5.4334
Sum,10866
Variance,2.0265
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
0,11413,68.9%,
1,2559,15.5%,
2,1273,7.7%,
3,614,3.7%,
4,303,1.8%,
5,160,1.0%,
6,104,0.6%,
7,46,0.3%,
8,33,0.2%,
9,18,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,11413,68.9%,
1,2559,15.5%,
2,1273,7.7%,
3,614,3.7%,
4,303,1.8%,

Value,Count,Frequency (%),Unnamed: 3
17,2,0.0%,
20,1,0.0%,
22,2,0.0%,
30,1,0.0%,
41,1,0.0%,

0,1
Distinct count,167
Unique (%),1.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,37.229
Minimum,0
Maximum,166
Zeros (%),0.2%

0,1
Minimum,0
5-th percentile,7
Q1,13
Median,26
Q3,50
95-th percentile,107
Maximum,166
Range,166
Interquartile range,37

0,1
Standard deviation,33.22
Coef of variation,0.89234
Kurtosis,2.8303
Mean,37.229
MAD,24.826
Skewness,1.6965
Sum,616507
Variance,1103.6
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
11,637,3.8%,
10,590,3.6%,
9,571,3.4%,
13,550,3.3%,
12,548,3.3%,
8,467,2.8%,
14,435,2.6%,
7,429,2.6%,
15,396,2.4%,
16,339,2.0%,

Value,Count,Frequency (%),Unnamed: 3
0,25,0.2%,
1,39,0.2%,
2,21,0.1%,
3,50,0.3%,
4,104,0.6%,

Value,Count,Frequency (%),Unnamed: 3
162,11,0.1%,
163,12,0.1%,
164,2,0.0%,
165,4,0.0%,
166,1,0.0%,

0,1
Distinct count,487
Unique (%),2.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,38.706
Minimum,1
Maximum,1166
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,2
Q1,3
Median,9
Q3,40
95-th percentile,181
Maximum,1166
Range,1165
Interquartile range,37

0,1
Standard deviation,76.611
Coef of variation,1.9793
Kurtosis,33.258
Mean,38.706
MAD,44.002
Skewness,4.6438
Sum,640976
Variance,5869.2
Memory size,129.5 KiB

Value,Count,Frequency (%),Unnamed: 3
2,2111,12.7%,
3,1915,11.6%,
4,1073,6.5%,
5,745,4.5%,
6,682,4.1%,
7,652,3.9%,
8,603,3.6%,
9,531,3.2%,
10,429,2.6%,
11,337,2.0%,

Value,Count,Frequency (%),Unnamed: 3
1,308,1.9%,
2,2111,12.7%,
3,1915,11.6%,
4,1073,6.5%,
5,745,4.5%,

Value,Count,Frequency (%),Unnamed: 3
1001,1,0.0%,
1013,1,0.0%,
1139,1,0.0%,
1144,1,0.0%,
1166,1,0.0%,

0,1
Distinct count,310
Unique (%),1.9%
Missing (%),0.0%
Missing (n),0

0,1
27th Dáil,435
28th Dáil,422
29th Dáil,411
Other values (307),15292

Value,Count,Frequency (%),Unnamed: 3
27th Dáil,435,2.6%,
28th Dáil,422,2.5%,
29th Dáil,411,2.5%,
20th Dáil,404,2.4%,
24th Dáil,391,2.4%,
8th Dáil,375,2.3%,
22nd Seanad,374,2.3%,
21st Seanad,352,2.1%,
4th Dáil,351,2.1%,
18th Dáil,346,2.1%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
house,11346
committee,5214

Value,Count,Frequency (%),Unnamed: 3
house,11346,68.5%,
committee,5214,31.5%,

0,1
Distinct count,208
Unique (%),1.3%
Missing (%),0.0%
Missing (n),0

0,1
,11346
joint_committee_on_european_affairs,325
committee_of_public_accounts,288
Other values (205),4601

Value,Count,Frequency (%),Unnamed: 3
,11346,68.5%,
joint_committee_on_european_affairs,325,2.0%,
committee_of_public_accounts,288,1.7%,
joint_committee_on_health_and_children,249,1.5%,
joint_committee_on_foreign_affairs,223,1.3%,
joint_committee_on_transport,155,0.9%,
joint_committee_on_finance_and_the_public_service,134,0.8%,
select_committee_on_finance_and_the_public_service,132,0.8%,
joint_committee_on_education_and_science,131,0.8%,
joint_committee_on_enterprise_and_small_business,121,0.7%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
dail,12633
seanad,3927

Value,Count,Frequency (%),Unnamed: 3
dail,12633,76.3%,
seanad,3927,23.7%,

0,1
Distinct count,37
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0

0,1
29,2217
30,1705
28,902
Other values (34),11736

Value,Count,Frequency (%),Unnamed: 3
29,2217,13.4%,
30,1705,10.3%,
28,902,5.4%,
31,856,5.2%,
20,772,4.7%,
27,744,4.5%,
21,708,4.3%,
24,586,3.5%,
19,522,3.2%,
17,498,3.0%,

0,1
Distinct count,318
Unique (%),1.9%
Missing (%),0.0%
Missing (n),0

0,1
/ie/oireachtas/house/dail/27,435
/ie/oireachtas/house/dail/28,422
/ie/oireachtas/house/dail/29,411
Other values (315),15292

Value,Count,Frequency (%),Unnamed: 3
/ie/oireachtas/house/dail/27,435,2.6%,
/ie/oireachtas/house/dail/28,422,2.5%,
/ie/oireachtas/house/dail/29,411,2.5%,
/ie/oireachtas/house/dail/20,404,2.4%,
/ie/oireachtas/house/dail/24,391,2.4%,
/ie/oireachtas/house/dail/8,375,2.3%,
/ie/oireachtas/house/seanad/22,374,2.3%,
/ie/oireachtas/house/seanad/21,352,2.1%,
/ie/oireachtas/house/dail/4,351,2.1%,
/ie/oireachtas/house/dail/18,346,2.1%,

0,1
Distinct count,8740
Unique (%),52.8%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1919-01-22 00:00:00
Maximum,2016-12-21 00:00:00

0,1
Constant value,debate

0,1
Distinct count,1746
Unique (%),10.5%
Missing (%),0.0%
Missing (n),0

0,1
2017-03-24T18:28:50+00:00,27
2017-03-24T18:29:24+00:00,26
2017-03-24T18:30:06+00:00,26
Other values (1743),16481

Value,Count,Frequency (%),Unnamed: 3
2017-03-24T18:28:50+00:00,27,0.2%,
2017-03-24T18:29:24+00:00,26,0.2%,
2017-03-24T18:30:06+00:00,26,0.2%,
2017-03-24T18:30:04+00:00,26,0.2%,
2017-03-24T18:31:56+00:00,25,0.2%,
2017-03-24T18:30:44+00:00,25,0.2%,
2017-03-24T18:29:48+00:00,25,0.2%,
2017-03-24T18:29:44+00:00,25,0.2%,
2017-03-24T18:35:22+00:00,25,0.2%,
2017-03-24T18:29:36+00:00,25,0.2%,

0,1
Distinct count,16559
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0

0,1
/akn/ie/debateRecord/seanad/1936-01-01/debate/main,2
/akn/ie/debateRecord/dail/1952-11-12/debate/main,1
/akn/ie/debateRecord/dail/1971-02-17/debate/main,1
Other values (16556),16556

Value,Count,Frequency (%),Unnamed: 3
/akn/ie/debateRecord/seanad/1936-01-01/debate/main,2,0.0%,
/akn/ie/debateRecord/dail/1952-11-12/debate/main,1,0.0%,
/akn/ie/debateRecord/dail/1971-02-17/debate/main,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_arts_sport_tourism_community_rural_and_gaeltacht_affairs/2008-10-08/debate/main,1,0.0%,
/akn/ie/debateRecord/seanad/1993-04-08/debate/main,1,0.0%,
/akn/ie/debateRecord/dail/2008-10-29/debate/main,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_justice_equality_defence_and_womens_rights/2009-01-27/debate/main,1,0.0%,
/akn/ie/debateRecord/select_committee_on_justice_equality_defence_and_womens_rights/2005-05-03/debate/main,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_education_and_science/2009-12-02/debate/main,1,0.0%,
/akn/ie/debateRecord/joint_committee_on_european_union_affairs/2012-06-27/debate/main,1,0.0%,

Unnamed: 0,formats.xml.uri,formats.pdf.uri,chamber.showAs,chamber.uri,counts.questionCount,counts.billCount,counts.divisionCount,counts.contributorCount,counts.debateSectionCount,house.showAs,house.chamberType,house.committeeCode,house.houseCode,house.houseNo,house.uri,date,debateType,lastUpdated,uri
0,/akn/ie/debateRecord/seanad/1947-12-19/debate/mul@/main.xml,,Seanad Éireann,/ie/oireachtas/house/seanad,0,8,0,23,9,5th Seanad,house,,seanad,5,/ie/oireachtas/house/seanad/5,1947-12-19,debate,2017-03-24T19:34:42+00:00,/akn/ie/debateRecord/seanad/1947-12-19/debate/main
1,/akn/ie/debateRecord/seanad/1947-12-18/debate/mul@/main.xml,,Seanad Éireann,/ie/oireachtas/house/seanad,0,5,1,20,8,5th Seanad,house,,seanad,5,/ie/oireachtas/house/seanad/5,1947-12-18,debate,2017-03-24T19:34:42+00:00,/akn/ie/debateRecord/seanad/1947-12-18/debate/main
2,/akn/ie/debateRecord/seanad/1947-12-17/debate/mul@/main.xml,,Seanad Éireann,/ie/oireachtas/house/seanad,0,3,0,19,6,5th Seanad,house,,seanad,5,/ie/oireachtas/house/seanad/5,1947-12-17,debate,2017-03-24T19:34:40+00:00,/akn/ie/debateRecord/seanad/1947-12-17/debate/main
3,/akn/ie/debateRecord/seanad/1947-12-12/debate/mul@/main.xml,,Seanad Éireann,/ie/oireachtas/house/seanad,0,2,0,13,5,5th Seanad,house,,seanad,5,/ie/oireachtas/house/seanad/5,1947-12-12,debate,2017-03-24T19:34:40+00:00,/akn/ie/debateRecord/seanad/1947-12-12/debate/main
4,/akn/ie/debateRecord/seanad/1947-12-11/debate/mul@/main.xml,,Seanad Éireann,/ie/oireachtas/house/seanad,0,11,0,22,12,5th Seanad,house,,seanad,5,/ie/oireachtas/house/seanad/5,1947-12-11,debate,2017-03-24T19:34:40+00:00,/akn/ie/debateRecord/seanad/1947-12-11/debate/main
