In [1]:
from tqdm import tqdm
import pandas as pd
import numpy as np

from argos import translate

## Split into parts

In [3]:
data = pd.read_csv('../data/en-fr.csv', dtype={'en': str, 'pl': str}, na_values=[""])
data['fr'] = ''
data = data.rename(columns={'fr': 'pl'})
data = data.dropna(how='any', subset=['en'])

In [14]:
def split_dataframe(df, n):
    rows_per_dataframe = len(df) // n
    indices = np.arange(0, len(df), rows_per_dataframe)
    split_dataframes = [df.iloc[i:i+rows_per_dataframe] for i in indices]
    return split_dataframes

In [15]:
parts = split_dataframe(data, 10)
for idx, part in enumerate(parts):
    part.to_csv(f'../data/en-pl-{idx}.csv', index=False)

## Translate single part

In [2]:
def translate_part(part_path, save_interval=60):
    data = pd.read_csv(part_path)
    for i, row in tqdm(data.iterrows(), total=len(data)):
        if not pd.isna(row['en']):
            print('skip')
            continue
        try:
            data.at[i, 'pl'] = translate(row['en'])
        except Exception:
            print('Error while translating', repr(row['en']))
        
        if i % save_interval == 0:
            data.to_csv(part_path)

In [3]:
translate_part('../data/en-pl-2.csv')

  data = pd.read_csv(part_path)
  0%|          | 0/2252029 [00:00<?, ?it/s]

Error while translating 'Legal and public policy norms on both are likely to be informed by different genetic testing rationales.'


  0%|          | 45/2252029 [00:11<117:21:56,  5.33it/s]

Error while translating 'B. Testing Rationales As the discussion in Part II and Table A illustrate, there would appear to be a consensus within the legal, ethical and public policy literatures that genetic testing raises human rights issues.'
Error while translating 'In particular, the discussion in section II.B.I - which summarizes some of the standards tests relied on to weigh and resolve human right conflicts - indicates that the kind and weight of the objectives, the necessity of the chosen means and whether they relate rationally to the stated objectives, potential alternatives, and the balance between positive and negative effects, are some of the critical factors in determining the lawfulness of practices that infringe human rights.'
Error while translating 'Accordingly, a major challenge for genetic testing policy is to articulate, precisely, the rationales and means of testing interventions.'
Error while translating 'This is important for coherent health policy initiatives bas

  0%|          | 176/2252029 [00:12<20:32:25, 30.45it/s]

Error while translating 'Reasonable minds may differ over how much employer paternalism based on employee safety is legitimate.'
Error while translating 'The court ruled that a petrochemical company had violated federal disability discrimination law when it refused to rehire a worker after a routine employment medical exam had revealed that the employee had a liver condition that the company feared might be aggravated by hazardous chemical work.'
Error while translating '139 The ruling is consistent with an earlier U.S. ruling on the paternalistic exclusion of a building repairer with diabetes from the workplace.'
Error while translating '140 Second, initiatives might be undertaken to protect fellow employees from safety risks associated with late onset genetic disorders.'
Error while translating "If it were determined, on the basis of objective scientific evidence, that an employee's diabetes posed significant safety risks to co-workers, then the medical management of the worker's dia

  0%|          | 299/2252029 [00:12<8:37:08, 72.57it/s] 

Error while translating 'Indeed, as indicated, the nature and potential abuse of the information received from predictive genetic testing in non-therapeutic contexts have prompted some in the international community to prohibit or strictly regulate non-therapeutic predictive testing.'
Error while translating 'Genetic and Race Discrimination - Screen and Exclude or Monitor?'
Error while translating 'Those who receive the sickle cell gene from both parents will have the chronic anemia and fragile, abnormal blood cells characteristic of the disease.'
Error while translating 'Particular circumstances such as dehydration and acute oxygen deprivation can provoke these fragile blood cells to sickle.'
Error while translating 'The sickling, in turn, prevents the transport of oxygen to tissues, and so may cause organ damage.'
Error while translating 'In 1970, at about the time a test was developed to screen for sickle cell, the medical literature reported the deaths of four African-American army

  0%|          | 446/2252029 [00:12<3:57:21, 158.10it/s]

Error while translating 'It would also advance within Canada the principles of the Universal Declaration of Human Rights, the International Covenant on Civil and Political Rights, and the UNESCO Declaration.'
Error while translating 'It would begin to transform the CHRA from a strictly non-discrimination statute towards a full human rights law.'
Error while translating 'Modernization of the CHRA is consistent with human privacy needs in the face of the unfolding revolutions in genetic and information technology.'
Error while translating 'This should be made part of a proposed review of the Privacy Act.'
Error while translating 'Finally, to develop effective national norms on genetic privacy protection in such areas as the workplace and insurance, such departments as Health Canada, the Department of Justice Canada, the Canadian Institutes of Health Research, and the Privacy Commission of Canada should begin formal collaboration to do so.'
Error while translating 'Accordingly, the Canadi

  0%|          | 593/2252029 [00:12<2:15:32, 276.84it/s]

Error while translating 'The Uses and Misuses of Personal Data In Employer/Employee Relationships.'
Error while translating 'London,1999 \u2028-Advisory Committee on Genetic Testing.'
Error while translating 'London, 1993:90-92 U.S.A. Institute of Medicine, Committee on Assessing Genetic Risks.'
Error while translating 'Office of the President.'
Error while translating 'To Prohibit Discrimination in Federal Employment Based on Genetic Information.'
Error while translating 'US Department of Health & Human Services, National Institutes of Health (NIH).'
Error while translating '-NIH/Department of Energy Working Group on Ethical, Legal and Social Implications of Human Genome Research.'
Error while translating '-Request for Public Comments on Genetic Testing.'
Error while translating '1999; 64: 67273.\u2028\u2028-Preliminary Recommendations on the Adequacy of Oversight of Genetic Tests.'
Error while translating 'Washington, DC, 2000.'
Error while translating 'Section 902--Definition of the

  0%|          | 662/2252029 [00:12<1:51:52, 335.38it/s]

Error while translating "Although empirical evidence was limited, much of the research suggests that strengthening community-based resources and building communities' capacity to address health issues are very promising strategies."
Error while translating 'While much of the evidence reviewed in this report supports the existence of a healthy immigrant effect in Canada with respect to chronic diseases, it was difficult to draw firm conclusions regarding this effect for many health outcomes and within most immigrant sub-groups.'
Error while translating 'More research is needed to better answer questions about whether the health status of immigrants is improving, how health determinants change over time, and the effect of acculturation on health.'
Error while translating 'It is recommended that steps be taken to strengthen existing databases, and to develop new databases on immigration and health in Canada.'
Error while translating 'Introduction The purpose of this report is to review re

  0%|          | 794/2252029 [00:13<1:29:45, 418.06it/s]

Error while translating "Rather, the results of the logistic regression models suggested that socio-economic factors were more important for immigrants than for non-immigrants and that there was no simple explanation for the complexity of immigrants' experiences."
Error while translating 'Laroche (2000) found that immigrants and Canadian-born persons who were female, of lowincome or had not completed secondary education were more likely to suffer from long-term disabilities than men with a high household income or high educational attainment.'
Error while translating 'A study of Korean Canadians suggested social and psychological resources were important for the successful adaptation of immigrants and were significant predictors of health outcomes (Noh & Avison, 1996).'
Error while translating 'The study alsofound that economic class immigrants reported higher levels of satisfaction with social support than family class immigrants and refugees.'
Error while translating '(1999) also exp

  0%|          | 925/2252029 [00:13<1:15:58, 493.88it/s]

Error while translating 'In their review of the literature on the health problems of immigrants in the United States, Flaskerud & Kim (1999) reported that "deaths due to cancer increased at faster rates among Asian and Pacific Islanders than any other racial or ethnic group."'
Error while translating 'Although Asian women had a lower incidence of breast cancer and better survival rates in comparison to other ethnic groups, there was well-documented evidence that incidence and mortality rates were increasing among second-generation women.'
Error while translating 'Maskarinec (2000) compared breast cancer risk among women of Japanese ancestry living in Asia and in the United States, including Hawaii, and found that while the first generation experienced only a small change in breast cancer rates, the second and third generations experienced considerable changes.'
Error while translating 'This was especially the case among women who immigrated early in life (Carballo et al., 1998).'
Error

  0%|          | 1000/2252029 [00:15<9:48:41, 63.73it/s]


KeyboardInterrupt: 

## Join parts

In [None]:
# TODO