# ConSciScanner - Readability in Py27

This notebook should be run in a Python 2.7 environment.

It also assumes 'textstat' is installed, which can be done with:

$ pip install textstat

In [75]:
import os

# Import textstat
from textstat.textstat import textstatistics

# Import custom code
from consc.data import load_folder

In [76]:
# Base path is the parent of the current working directory;
# the data is expected in its 'Data' subfolder
base_path = os.path.split(os.getcwd())[0]
dat_path = os.path.join(base_path, 'Data')

In [77]:
# Term whose data is analyzed in this notebook
current_term = 'autism'

# Load the 'Papers' folder, then the 'PRs' folder, for that term
paper_dat, press_dat = (load_folder(folder, current_term, dat_path)
                        for folder in ('Papers', 'PRs'))

In [78]:
# Create the textstat object; its methods (syllable_count, flesch_reading_ease, ...)
# compute every readability measure printed in the cells below
ts = textstatistics()

In [79]:
# Index used to pick one entry from both paper_dat and press_dat
# for the test run of each measure below
ind = 5

In [80]:
# Syllable count of the selected entry: paper first, then press
print('Syllable Count:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.syllable_count(doc.text))

Syllable Count:
653
1099


In [81]:
# Flesch Reading Ease of the selected entry: paper first, then press.
# The label names the measure actually computed by flesch_reading_ease
# (previously misspelled and labelled as a Flesch-Kincaid score).
print('Flesch Reading Ease:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.flesch_reading_ease(doc.text))

Flesh-Kincaid Ease:
19.91
47.32


In [82]:
# Flesch-Kincaid Grade of the selected entry: paper first, then press.
# Label spelling corrected from 'Flesh' to 'Flesch'.
print('Flesch-Kincaid Grade:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.flesch_kincaid_grade(doc.text))

Flesh-Kincaid Grade:
16.9
12.6


In [83]:
# Automated Readability Index of the selected entry: paper first, then press
print('Automated Readability Index:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.automated_readability_index(doc.text))

Automated Readability Index:
20.8
15.4


In [84]:
# Coleman Liau Index of the selected entry: paper first, then press
print('Coleman Liau Index:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.coleman_liau_index(doc.text))

Coleman Liau Index:
19.21
13.7


In [85]:
# Dale Chall Readability Score of the selected entry: paper first, then press
print('Dale Chall Readability Score:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.dale_chall_readability_score(doc.text))

Dale Chall Readability Score:
9.72
8.78


In [86]:
# Gunning Fog score of the selected entry: paper first, then press
print('Gunning Fog:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.gunning_fog(doc.text))

Gunning Fog:
24.4991044776
21.5635413643


In [87]:
# Smog Index of the selected entry: paper first, then press
print('Smog Index:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.smog_index(doc.text))

Smog Index:
19.1
13.7


In [88]:
# Linsear Write Formula of the selected entry: paper first, then press
print('Linsear Write Formula:')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.linsear_write_formula(doc.text))

Linsear Write Formula:
11.25
13.25


In [89]:
# Consensus (text_standard) result for the selected entry: paper first, then press
print('Consensus measure (text-standard):')
for doc in (paper_dat[ind], press_dat[ind]):
    print(ts.text_standard(doc.text))

Consensus measure (text-standard):
20th and 21th grade
13th and 14th grade
