Skip to content

Commit

Permalink
RI: extract_text
Browse files Browse the repository at this point in the history
  • Loading branch information
jamesturk committed Apr 24, 2012
1 parent 10b9535 commit c3d2852
Showing 1 changed file with 8 additions and 1 deletion.
9 changes: 8 additions & 1 deletion openstates/ri/__init__.py
@@ -1,4 +1,6 @@
import datetime
from billy.fulltext import (pdfdata_to_text, oyster_text,
text_after_line_numbers)

metadata = dict(
_partial_vote_bill_id=True,
Expand Down Expand Up @@ -30,8 +32,13 @@ def session_list():
return url_xpath( 'http://status.rilin.state.ri.us/bill_history.aspx?mode=previous',
"//select[@name='ctl00$rilinContent$cbYear']/option/text()" )

@oyster_text
def extract_text(oyster_doc, data):
return text_after_line_numbers(pdfdata_to_text(data))

document_class = dict(
AWS_PREFIX = 'documents/ri/',
update_mins = 24*7*60,
extract_text = extract_text,
onchanged = []
)
)

0 comments on commit c3d2852

Please sign in to comment.