In [None]:
from guide_parser import get_text


# Download the Article 1 guide and dump whatever get_text returns for it,
# as a quick eyeball check of the raw extraction.
url = "https://ks.echr.coe.int/documents/d/echr-ks/guide_art_1_eng"
guide_text = get_text(url)
print(guide_text)

In [None]:
from guide_parser import GuideParser

# Parse the Article 3 guide; starting_string is the opening text of the
# guide's paragraph 1 (presumably where the parser begins — confirm in guide_parser).
art_3_parser = GuideParser(
    guide_id="guide_art_3_eng",
    starting_string="1.  The Court’s approach to the interpretation",
)
paragraphs = art_3_parser.parse()

# Preview each parsed item: 1-based position, first 20 and last 20 characters.
for number, text in enumerate(paragraphs, start=1):
    head = text[:20]
    tail = text[-20:]
    print(f"{number}. {head} ... {tail}")

In [4]:
from guide_parser import GuideParser

# Extra GuideParser keyword arguments per guide, keyed by guide id.
# An empty dict means the parser is constructed with guide_id only.
# Insertion order is preserved and is the order in which guides are processed.
guide_overrides = {
    "guide_art_1_eng": {"remove_patterns": ["Concepts of “jurisdiction” and imputability"]},
    "guide_art_2_eng": {},
    "guide_art_3_eng": {"starting_string": "1.  The Court’s approach to the interpretation"},
    "guide_art_4_eng": {},
    "guide_art_5_eng": {},
    "guide_art_6_civil_eng": {},
    "guide_art_6_criminal_eng": {},
    "guide_art_7_eng": {"starting_string": "1.  The guarantee enshrined in Article 7"},
    "guide_art_8_eng": {},
    "guide_art_9_eng": {},
    "guide_art_10_eng": {},
    "guide_art_11_eng": {},
    "guide_art_12_eng": {"starting_string": "1.  Article 12 of the Convention guarantees"},
    "guide_art_13_eng": {},
    "guide_art_14_art_1_protocol_12_eng": {},
    "guide_art_15_eng": {},
    "guide_art_17_eng": {},
    "guide_art_18_eng": {},
    # The admissibility guide is the only entry that passes its own url.
    "Admissibility_guide_ENG": {
        "url": "https://www.echr.coe.int/documents/d/echr/",
        "starting_string": "1.  The  system  of  protection  of  fundamental  rights",
    },
    "guide_art_46_eng": {"starting_string": "1.  One of the most significant features of the Convention"},
    "guide_art_1_protocol_1_eng": {},
    "guide_art_2_protocol_1_eng": {},
    "guide_art_3_protocol_1_eng": {},
    "guide_art_2_protocol_4_eng": {"starting_string": "1.  Article 2 of Protocol No. 4 guarantees three"},
    "guide_art_3_protocol_4_eng": {"starting_string": "1.  Article 3, Protocol No. 4 guarantees two"},
    "guide_art_4_protocol_4_eng": {},
    "guide_art_1_protocol_7_eng": {"starting_string": "1.  Protocol No. 7 to the European Convention"},
    "guide_art_2_protocol_7_eng": {"starting_string": "1.  Article 2  of  Protocol  No.  7  complements  the  guarantees"},
    "guide_art_4_protocol_7_eng": {"starting_string": "1.  Protocol No. 7 to the Convention"},
    "guide_data_protection_eng": {"starting_string": "1.  Technological progress has led to a quantum"},
    "guide_environment_eng": {"starting_string": "1.  The positive obligation on States to take"},
    "guide_immigration_eng": {"starting_string": "1.  The present  document is"},
    "guide_mass_protests_eng": {"starting_string": "1.  The  present  Guide  analyses  the  Court’s"},
    "guide_prisoners_rights_eng": {"starting_string": "1.  The Court is frequently called upon to"},
    "guide_lgbti_rights_eng": {"starting_string": "1.  The  Convention  is  a  living  instrument  which"},
    "guide_social_rights_eng": {"starting_string": "1.  The Convention as adopted in 1950 reflected"},
    "guide_terrorism_eng": {"starting_string": "1.   Since its first ever judgment Lawless v. Ireland"},
}

# One GuideParser per guide, keyed by the same id that is passed as guide_id.
parsers = {
    guide_id: GuideParser(guide_id=guide_id, **overrides)
    for guide_id, overrides in guide_overrides.items()
}

In [10]:
import pandas as pd
from pandas import DataFrame

def replace_guide(guide_id: str, df: DataFrame, csv_path: str = "echr_case_law_guides.csv") -> None:
    """Replace every row of one guide in the case-law-guides CSV.

    Reads the CSV, drops all rows whose ``guide_id`` column equals
    ``guide_id``, appends the rows of ``df`` after the remaining ones, and
    writes the result back to the same file without an index column.

    Args:
        guide_id: Value of the ``guide_id`` column identifying the rows to drop.
        df: Replacement rows, appended as-is after the surviving rows.
        csv_path: CSV file to rewrite in place. Defaults to the file name the
            notebook has always used, so existing calls behave as before.

    Raises:
        FileNotFoundError: If ``csv_path`` does not exist.
        KeyError: If the existing CSV has no ``guide_id`` column.
    """
    existing = pd.read_csv(csv_path)
    kept = existing[existing['guide_id'] != guide_id]  # discard the guide's old rows
    # ignore_index avoids carrying duplicate row labels in the merged frame;
    # the labels are never written out because of index=False below.
    merged = pd.concat([kept, df], ignore_index=True)
    # Drop "Unnamed: N" columns, which read_csv creates when an earlier save
    # wrote the index as a header-less column.
    merged = merged.loc[:, ~merged.columns.str.startswith('Unnamed')]
    merged.to_csv(csv_path, index=False)

# Re-parse a single guide and swap its rows into the saved CSV.
# The id is bound once so the lookup and the replacement cannot drift apart.
target_guide_id = "guide_art_1_eng"
parser = parsers[target_guide_id]
df = parser.to_csv()  # the result is handed to replace_guide, which expects a DataFrame

replace_guide(target_guide_id, df)

# Keep the frame as the cell's last expression so the notebook renders it;
# a bare `df` in the middle of a cell is evaluated and then discarded.
df

In [None]:
import pandas as pd

# Rebuild the complete CSV from scratch: run every registered parser, stack
# the per-guide frames, and overwrite echr_case_law_guides.csv.
frames = []

for key, parser in parsers.items():
    dfg = parser.to_csv()
    frames.append(dfg)
    # Report the size of the frame just produced for this guide. The previous
    # version printed len(paragraphs), a leftover from an earlier cell that
    # showed the same unrelated number for every guide.
    print(key, len(dfg))

if frames:
    # Concatenate once instead of re-copying the growing frame on every iteration.
    df = pd.concat(frames, ignore_index=True)
    # Drop stray "Unnamed: N" columns (an index saved as a header-less column).
    df = df.loc[:, ~df.columns.str.startswith('Unnamed')]
else:
    # No parsers registered: keep the old outcome of an empty frame.
    df = pd.DataFrame()

df.to_csv("echr_case_law_guides.csv", index=False)
df