# Synthesizing data

In [1]:
WIKI_FN = '../wiki/data.jobcensus.rc.wiki.2020-12-2.csv'

In [2]:
import pandas as pd,os,sys
from datetime import datetime
import warnings,re
warnings.filterwarnings('ignore')

## Load data

In [3]:
df_wiki0 = pd.read_csv(WIKI_FN)

In [4]:
df_wiki0[:2]

Unnamed: 0,disc_page,year,page,page_group,section_content,section_links,section_title,IsTT,IsUni,JobType,JobID
0,Rhetoric/Composition 2011,2011,Rhetoric/Composition_2011,Rhetoric/Composition,"<span class=""",,Rhetoric/Composition Jobs 2011,,n,Unknown,Rhetoric/Composition Jobs 2011
1,Rhetoric/Composition 2011,2011,Rhetoric/Composition_2011,Rhetoric/Composition,Link - first posting on page\nSubfield/descrip...,http://www.acu.edu/academics/provost/positions...,"Abilene Christian University (Abilene, TX)",y,y,TT,http://www.acu.edu/academics/provost/positions...


In [5]:
df_wiki0['JobSource']='Wiki'

## Rename cols

In [6]:
# Keep only the rows where IsUni == 'y', select the columns of interest, blank
# out missing values, and map the wiki column names onto the Job* names used
# in the rest of the notebook.
wiki_to_job_cols = {
    'section_title': 'JobTitle',
    'year': 'JobYear',
    'section_links': 'JobLink',
    'JobType': 'JobType',
    'page_group': 'JobField',
    'JobSource': 'JobSource',
}
df_wiki = (
    df_wiki0.loc[df_wiki0.IsUni == 'y', list(wiki_to_job_cols)]
    .fillna('')
    .rename(columns=wiki_to_job_cols)
)
df_wiki

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource
1,"Abilene Christian University (Abilene, TX)",2011,http://www.acu.edu/academics/provost/positions...,TT,Rhetoric/Composition,Wiki
2,Alfred State College (NY),2011,http://www.higheredjobs.com/faculty/details.cf...,TT,Rhetoric/Composition,Wiki
3,American University of Beirut,2011,mailto:as_dean@aub.edu.lb | http://www.aub.edu...,Unknown,Rhetoric/Composition,Wiki
4,"Angelo State University (San Angelo, TX)",2011,http://www.higheredjobs.com/search/details.cfm...,TT,Rhetoric/Composition,Wiki
5,Arizona State University (Advanced Assistant P...,2011,http://www.asu.edu/clas/english | http://www.w...,Unknown,Rhetoric/Composition,Wiki
...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki


In [7]:
df_wiki[(df_wiki.JobYear == 2020) & (df_wiki.JobField=='Rhetoric/Composition')]

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource
9279,Allen University: Assistant Professor of English,2020,,TT,Rhetoric/Composition,Wiki
9280,"Brock University: Assistant Professor, Busines...",2020,https://brocku.wd3.myworkdayjobs.com/en-US/bro...,TT,Rhetoric/Composition,Wiki
9281,Baruch College: Lecturer - Writing,2020,https://home.cunyfirst.cuny.edu/psp/cnyepprd/G...,Non-TT,Rhetoric/Composition,Wiki
9282,Baruch College: Assistant Professor - Digital ...,2020,https://home.cunyfirst.cuny.edu/psp/cnyepprd/G...,TT,Rhetoric/Composition,Wiki
9283,University of Central Florida: Associate Profe...,2020,https://jobs.ucf.edu/en-us/job/498553/associat...,TT,Rhetoric/Composition,Wiki
...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki


### Clean links

In [8]:
def clean_wiki_links(x):
    """Normalise a wiki link cell to a shortened MLA job-list URL when it has one.

    The cell is read as a ' | '-separated list of links. The first link that
    contains 'joblist.mla.org' is returned with its last two '/'-separated
    pieces removed. If no link matches, the input is returned unchanged
    (not stringified).
    """
    mla_links = [part for part in str(x).split(' | ') if 'joblist.mla.org' in part]
    if not mla_links:
        return x
    segments = mla_links[0].split('/')
    return '/'.join(segments[:-2])
df_wiki['JobLink_norm']=df_wiki['JobLink'].apply(clean_wiki_links)

In [9]:
df_wiki.JobLink_norm.value_counts()

                                                                                                                                                                                                                                                                                                   954
https://academicjobs.wikia.org/index.php?title=Rhetoric/Composition_2012#top                                                                                                                                                                                                                        61
https://apply.interfolio.com/22610 | http://www.higheredjobs.com/faculty/details.cfm?JobCode=175753939&Title=Assistant%20Professor%20of%20English | http://www.higheredjobs.com/faculty/details.cfm?JobCode=175849175&Title=Assistant%20Professor%20of%20English                                    13
http://jobs.gmu.edu/                                                                                               

### Find overlap

In [10]:
df_all = df_wiki #.append(df_mla)
df_all

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
1,"Abilene Christian University (Abilene, TX)",2011,http://www.acu.edu/academics/provost/positions...,TT,Rhetoric/Composition,Wiki,http://www.acu.edu/academics/provost/positions...
2,Alfred State College (NY),2011,http://www.higheredjobs.com/faculty/details.cf...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/faculty/details.cf...
3,American University of Beirut,2011,mailto:as_dean@aub.edu.lb | http://www.aub.edu...,Unknown,Rhetoric/Composition,Wiki,mailto:as_dean@aub.edu.lb | http://www.aub.edu...
4,"Angelo State University (San Angelo, TX)",2011,http://www.higheredjobs.com/search/details.cfm...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/search/details.cfm...
5,Arizona State University (Advanced Assistant P...,2011,http://www.asu.edu/clas/english | http://www.w...,Unknown,Rhetoric/Composition,Wiki,http://www.asu.edu/clas/english | http://www.w...
...,...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki,https://www.pacificu.edu/academics/academic-re...
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki,
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki,
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki,https://jobs.weber.edu/postings/9890


In [11]:
# drop duplicates
# Two rows count as duplicates when title, year and the raw link cell all match;
# the first occurrence is kept (pandas default).
# NOTE(review): the key uses the raw JobLink, not JobLink_norm -- confirm that is intended.
df_all=df_all.drop_duplicates(['JobTitle','JobYear','JobLink'])
df_all

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
1,"Abilene Christian University (Abilene, TX)",2011,http://www.acu.edu/academics/provost/positions...,TT,Rhetoric/Composition,Wiki,http://www.acu.edu/academics/provost/positions...
2,Alfred State College (NY),2011,http://www.higheredjobs.com/faculty/details.cf...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/faculty/details.cf...
3,American University of Beirut,2011,mailto:as_dean@aub.edu.lb | http://www.aub.edu...,Unknown,Rhetoric/Composition,Wiki,mailto:as_dean@aub.edu.lb | http://www.aub.edu...
4,"Angelo State University (San Angelo, TX)",2011,http://www.higheredjobs.com/search/details.cfm...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/search/details.cfm...
5,Arizona State University (Advanced Assistant P...,2011,http://www.asu.edu/clas/english | http://www.w...,Unknown,Rhetoric/Composition,Wiki,http://www.asu.edu/clas/english | http://www.w...
...,...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki,https://www.pacificu.edu/academics/academic-re...
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki,
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki,
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki,https://jobs.weber.edu/postings/9890


In [12]:
jf_list = list(set(df_all.JobField))
jf_list

['Environmental',
 'English Literature',
 'Musicology/Ethnomusicology',
 'Romanticism/Victorian/19th',
 'Renaissance',
 'Restoration/18th-Century',
 'Humanities and Social Sciences Postdocs',
 'New Media %26 Digital Humanities',
 'German',
 'Comparative Literature',
 'Theory',
 'British Open',
 '20-21 c. American',
 'New Media and Digital Humanities',
 'African American',
 'Comparative',
 'Children%27s',
 'American Open',
 'Medieval',
 'Social Work',
 'American Studies',
 'Queer/Women%27s/Gender Studies',
 'Community Colleges',
 'Modern British',
 'Music Theory/Composition',
 'TESOL/Applied Linguistics',
 'Queer/Women%27s/Gender Studies 2014#Texas A.26M - TT Advanced Assistant Professor.2C Gender and Sexuality Studies with an Emphasis in',
 'Environmental 2014#Christopher Newport University - Lecturer in English .28Environmental Rhetoric .26 Science Writing.29',
 'Anglophone',
 'CreativeWriting',
 'Spanish and Portuguese',
 'Generalist',
 'Rhetoric/Composition',
 'Other Ethnic American

In [13]:
# sanity check:  -->
df_all[(df_all.JobField=='Rhetoric/Composition') & (df_all.JobYear==2020)]

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
9279,Allen University: Assistant Professor of English,2020,,TT,Rhetoric/Composition,Wiki,
9280,"Brock University: Assistant Professor, Busines...",2020,https://brocku.wd3.myworkdayjobs.com/en-US/bro...,TT,Rhetoric/Composition,Wiki,https://brocku.wd3.myworkdayjobs.com/en-US/bro...
9281,Baruch College: Lecturer - Writing,2020,https://home.cunyfirst.cuny.edu/psp/cnyepprd/G...,Non-TT,Rhetoric/Composition,Wiki,https://home.cunyfirst.cuny.edu/psp/cnyepprd/G...
9283,University of Central Florida: Associate Profe...,2020,https://jobs.ucf.edu/en-us/job/498553/associat...,TT,Rhetoric/Composition,Wiki,https://jobs.ucf.edu/en-us/job/498553/associat...
9284,Biola University Assistant/Associate Professor...,2020,https://biola.csod.com/ats/careersite/JobDetai...,TT,Rhetoric/Composition,Wiki,https://joblist.mla.org/job-details/1105
...,...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki,https://www.pacificu.edu/academics/academic-re...
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki,
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki,
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki,https://jobs.weber.edu/postings/9890


## Prune out unknowns

In [14]:
# Tokeniser for job titles; a word may contain internal apostrophes ("women's").
# Compiled once instead of on every call, and written as a raw string so "\w"
# is not an invalid string escape.
_TITLE_WORD_RGX = re.compile(r"(\w[\w']*\w|\w)")

def get_jobtype(title,link=''):
    """Guess a job's type from keywords in its title.

    Rules are checked in order and the first match wins.

    Parameters
    ----------
    title : str
        Job title; matched case-insensitively. Non-string values are
        stringified first instead of raising.
    link : str, optional
        Job link, used only when no title rule matches. It is passed to
        ``get_jobtype_from_mla`` if a callable of that name exists at module
        level; otherwise it is ignored.

    Returns
    -------
    str
        'TT', 'Non-TT', 'Postdoc' or 'Unknown' (or whatever the MLA helper
        returns when it is used).
    """
    title = str(title).lower()
    contingent = 'adjunct' in title or 'part-time' in title

    if 'post-doc' in title or 'postdoc' in title: return 'Postdoc'
    if 'visiting' in title: return 'Non-TT'
    if 'professor' in title or 'open-rank' in title:
        # An adjunct or part-time professorship is not tenure-track. This used
        # to return 'TT' because the adjunct rule was only checked later.
        return 'Non-TT' if contingent else 'TT'
    if 'fellow' in title: return 'Postdoc'  # also covers 'fellowship'
    if contingent: return 'Non-TT'
    if 'director' in title: return 'Non-TT'
    if 'instructor' in title or 'freelance' in title: return 'Non-TT'
    # 'vap' must be a whole word, so it is matched against tokens, not substrings.
    if 'vap' in _TITLE_WORD_RGX.findall(title): return 'Non-TT'
    if 'lecturer' in title: return 'Non-TT'
    if link:
        # The MLA helper is not defined in this notebook; use it only if some
        # other cell or module provides it, rather than raising NameError.
        mla_lookup = globals().get('get_jobtype_from_mla')
        if callable(mla_lookup): return mla_lookup(link)
    return 'Unknown'

In [15]:
# Fill in missing job types: rows whose JobType is 'Unknown' get a type guessed
# from the title by get_jobtype; every other row keeps the type it already has.
df_all['JobType'] = [
    known_type if known_type != 'Unknown' else get_jobtype(job_title)
    for job_title, known_type in zip(df_all['JobTitle'], df_all['JobType'])
]

In [16]:
df_all[df_all.JobType=='Unknown']

Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
3,American University of Beirut,2011,mailto:as_dean@aub.edu.lb | http://www.aub.edu...,Unknown,Rhetoric/Composition,Wiki,mailto:as_dean@aub.edu.lb | http://www.aub.edu...
19,Cal State San Marcos,2011,http://www.csusm.edu/facultyopportunities,Unknown,Rhetoric/Composition,Wiki,http://www.csusm.edu/facultyopportunities
26,Claremont McKenna College,2011,https://webapps.cmc.edu/jobs/staff/staff_openi...,Unknown,Rhetoric/Composition,Wiki,https://webapps.cmc.edu/jobs/staff/staff_openi...
34,Columbia University (NY),2011,http://chronicle.com/jobs/0000649408-01/ | htt...,Unknown,Rhetoric/Composition,Wiki,http://chronicle.com/jobs/0000649408-01/ | htt...
36,Concordia University Chicago,2011,http://www.higheredjobs.com/faculty/details.cf...,Unknown,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/faculty/details.cf...
...,...,...,...,...,...,...,...
9235,Senior Faculty Positions,2020,,Unknown,German,Wiki,
9241,Faculty Positions outside of Canada and the U.S.,2020,https://www.lalia-berlin.com/jobs-1-1,Unknown,German,Wiki,https://www.lalia-berlin.com/jobs-1-1
9242,Multi-Language Faculty Positions,2020,https://aprecruit.berkeley.edu/JPF02679,Unknown,German,Wiki,https://aprecruit.berkeley.edu/JPF02679
9244,Other German-Related Faculty Positions,2020,,Unknown,German,Wiki,


In [17]:
list(set(df_all.JobField.values.tolist()))

['Environmental',
 'English Literature',
 'Musicology/Ethnomusicology',
 'Romanticism/Victorian/19th',
 'Renaissance',
 'Restoration/18th-Century',
 'Humanities and Social Sciences Postdocs',
 'New Media %26 Digital Humanities',
 'German',
 'Comparative Literature',
 'Theory',
 'British Open',
 '20-21 c. American',
 'New Media and Digital Humanities',
 'African American',
 'Comparative',
 'Children%27s',
 'American Open',
 'Medieval',
 'Social Work',
 'American Studies',
 'Queer/Women%27s/Gender Studies',
 'Community Colleges',
 'Modern British',
 'Music Theory/Composition',
 'TESOL/Applied Linguistics',
 'Queer/Women%27s/Gender Studies 2014#Texas A.26M - TT Advanced Assistant Professor.2C Gender and Sexuality Studies with an Emphasis in',
 'Environmental 2014#Christopher Newport University - Lecturer in English .28Environmental Rhetoric .26 Science Writing.29',
 'Anglophone',
 'CreativeWriting',
 'Spanish and Portuguese',
 'Generalist',
 'Rhetoric/Composition',
 'Other Ethnic American

In [18]:
len(df_all)

7348

In [19]:
# Collapse variant spellings of JobField (percent-encoded characters, stray
# spaces, page-anchor residue after the field name) onto one canonical label.
# Keys are the exact raw values to replace; values are the canonical names.
field_renames = {
    'New Media %26 Digital Humanities': 'New Media and Digital Humanities',
    'Queer/Women%27s/Gender Studies': 'Queer/Womens/Gender Studies',
    'Queer/Women%27s/Gender Studies 2014#Texas A.26M - TT Advanced Assistant Professor.2C Gender and Sexuality Studies with an Emphasis in': 'Queer/Womens/Gender Studies',
    'TESOL / Applied Linguistics': 'TESOL/Applied Linguistics',
    'Drama, Speech, Film %26 New Media': 'Drama, Speech, Film and New Media',
    'Environmental 2014#Christopher Newport University - Lecturer in English .28Environmental Rhetoric .26 Science Writing.29': 'Environmental',
}
for raw_field, canonical_field in field_renames.items():
    df_all.loc[df_all.JobField == raw_field, 'JobField'] = canonical_field
# Relabelling only: the row count should be unchanged.
len(df_all)

7348

In [20]:
list(set(df_all.JobField.values.tolist()))

['Drama, Speech, Film and New Media',
 'Environmental',
 'English Literature',
 'Musicology/Ethnomusicology',
 'Romanticism/Victorian/19th',
 'Renaissance',
 'Restoration/18th-Century',
 'Humanities and Social Sciences Postdocs',
 'German',
 'Comparative Literature',
 'Theory',
 'Queer/Womens/Gender Studies',
 'British Open',
 '20-21 c. American',
 'New Media and Digital Humanities',
 'African American',
 'Comparative',
 'Children%27s',
 'American Open',
 'Medieval',
 'Social Work',
 'American Studies',
 'Community Colleges',
 'Modern British',
 'Music Theory/Composition',
 'TESOL/Applied Linguistics',
 'Anglophone',
 'CreativeWriting',
 'Spanish and Portuguese',
 'Generalist',
 'Rhetoric/Composition',
 'Other Ethnic American',
 'Communication and Media Studies',
 'Creative Writing']

In [21]:
field_list = [
 'Communication and Media Studies',
 'Rhetoric/Composition',
 'Drama, Speech, Film and New Media',
 'Queer/Womens/Gender Studies',
 'Generalist',
 'New Media and Digital Humanities',
 'TESOL/Applied Linguistics',
 'Humanities and Social Sciences Postdocs',
 'Community Colleges'
]

In [22]:
df_reduced = df_all[df_all.JobField.isin(field_list)]
len(df_reduced)

4468

In [23]:
list(set(df_reduced.JobTitle))

['New York University - Director of Faculty Dev. / Clinical Faculty Position, Expository Writing Program (non-TT)',
 'Middlebury College - Postdoctoral Fellow in the Digital Liberal Arts',
 'Texas A&M University Corpus Christi (TX) - TT Assistant or Associate Professor of English - Writing Studies',
 'Dallas Community College District - North Lake (TX) - Faculty Full Time - English (2 Positions)',
 'James Madison University (3 TT positions, April 1 Deadline)',
 'United States Air Force Academy (CO) - Assistant Professor in Rhetoric and Composition - CAMPUS INTERVIEW SCHEDULED',
 'Clayton State University (GA) - TT Assistant or Associate Professorship in English - CAMPUS INTERVIEWS SCHEDULED',
 'University of Dayton (OH) - TT Assist. Professor: Technical Communication & Medical Humanities - SKYPE INTERVIEW STAGE',
 'Texas Christian University (TCU) - Advanced Assistant/Associate Professor of English - OFFER MADE & ACCEPTED',
 'Eastern Michigan University - TT Asst. Professor of Writing 

In [24]:
# List the rows whose title contains none of the institution / rank keywords
# below, so they can be inspected by hand before being filtered out.
# The pattern is a raw string with a non-capturing outer group: it matches the
# same titles as before, but the literal no longer contains the invalid "\s"
# string escape and str.contains no longer warns about match groups.
job_title_rgx = r'(?:Cold\sSpring\sHarbour|Cardinal\sStritch\sU|Loyola\sMaryland|Georgia\sSouthern\sU|Buena\sVista|CalPoly|Notre|Armstrong\sAtlantic|SUNY|Institute|Tech|State|University|College|Faculty|Open\sRank|Coordinator|Curator|Director|Carnegie|Professor|Associate|Instructor|Lecturer|Postdoc|postdoc|Fellow(?:ship)?)'
df_veracity_check = df_reduced[
    ~df_reduced.JobTitle.str.contains(job_title_rgx, regex=True)
]
print(len(df_veracity_check))
df_veracity_check

26


Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
92,North Carolina Central,2011,,TT,Rhetoric/Composition,Wiki,
556,Louisville,2011,,Unknown,"Drama, Speech, Film and New Media",Wiki,
612,Users,2011,,TT,TESOL/Applied Linguistics,Wiki,
637,UMASS-Lowell,2011,,Unknown,TESOL/Applied Linguistics,Wiki,
641,Texas A&M-Corpus Christi,2011,,Unknown,TESOL/Applied Linguistics,Wiki,
1022,[see full job ad] - OFFER ACCEPTED,2012,https://academicjobs.wikia.org/index.php?title...,TT,Generalist,Wiki,https://academicjobs.wikia.org/index.php?title...
4484,Asst. Prof - Sexuality Studies - OFFER ACCEPTED,2014,mailto:hmsxdept@sfsu.edu,Unknown,Queer/Womens/Gender Studies,Wiki,mailto:hmsxdept@sfsu.edu
4508,- SKYPE INTERVIEWS SCHEDULED,2014,,TT,Queer/Womens/Gender Studies,Wiki,
4511,"Stephanie Bennett-Smith Chair in Women, Gender...",2014,,Unknown,Queer/Womens/Gender Studies,Wiki,
8687,Edit,2019,https://writing.ufl.edu/%7C | //president.ufl....,Non-TT,Rhetoric/Composition,Wiki,https://writing.ufl.edu/%7C | //president.ufl....


### Issues

Most issues were non-job rows, which disproportionately impacted postdoc positions, notably in 2020.

In [25]:
# Keep only the rows whose title contains at least one institution / rank
# keyword; rows matching none of them are dropped.
# The pattern is a raw string with a non-capturing outer group: it matches the
# same titles as before, but the literal no longer contains the invalid "\s"
# string escape and str.contains no longer warns about match groups.
job_title_rgx = r'(?:Cold\sSpring\sHarbour|Cardinal\sStritch\sU|Loyola\sMaryland|Georgia\sSouthern\sU|Buena\sVista|CalPoly|Notre|Armstrong\sAtlantic|SUNY|Institute|Tech|State|University|College|Faculty|Open\sRank|Coordinator|Curator|Director|Carnegie|Professor|Associate|Instructor|Lecturer|Postdoc|postdoc|Fellow(?:ship)?)'
df_reduced = df_reduced[
    df_reduced.JobTitle.str.contains(job_title_rgx, regex=True)
]
print(len(df_reduced))
df_reduced

4442


Unnamed: 0,JobTitle,JobYear,JobLink,JobType,JobField,JobSource,JobLink_norm
1,"Abilene Christian University (Abilene, TX)",2011,http://www.acu.edu/academics/provost/positions...,TT,Rhetoric/Composition,Wiki,http://www.acu.edu/academics/provost/positions...
2,Alfred State College (NY),2011,http://www.higheredjobs.com/faculty/details.cf...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/faculty/details.cf...
3,American University of Beirut,2011,mailto:as_dean@aub.edu.lb | http://www.aub.edu...,Unknown,Rhetoric/Composition,Wiki,mailto:as_dean@aub.edu.lb | http://www.aub.edu...
4,"Angelo State University (San Angelo, TX)",2011,http://www.higheredjobs.com/search/details.cfm...,TT,Rhetoric/Composition,Wiki,http://www.higheredjobs.com/search/details.cfm...
5,Arizona State University (Advanced Assistant P...,2011,http://www.asu.edu/clas/english | http://www.w...,TT,Rhetoric/Composition,Wiki,http://www.asu.edu/clas/english | http://www.w...
...,...,...,...,...,...,...,...
9359,Pacific University (USA:OR) - Visiting Assista...,2020,https://www.pacificu.edu/academics/academic-re...,Non-TT,Rhetoric/Composition,Wiki,https://www.pacificu.edu/academics/academic-re...
9360,University of Tampa (USA:FL) - Professor of In...,2020,,Non-TT,Rhetoric/Composition,Wiki,
9361,"Field Instructor, Rhetoric And Composition",2020,,Non-TT,Rhetoric/Composition,Wiki,
9362,Weber State University (USA:UT) - Visiting Ass...,2020,https://jobs.weber.edu/postings/9890,Non-TT,Rhetoric/Composition,Wiki,https://jobs.weber.edu/postings/9890


## Save field names

In [26]:
# Write the field-alias table (JobField, FieldAlias, Count) to CSV.
# FieldAlias starts out as a copy of JobField. The file is only written when it
# does not exist yet, so an existing alias file is never overwritten.
field_alias_fn = 'data.jobcensus.rc.field_aliases.csv'
if not os.path.exists(field_alias_fn):
    field_counts = df_reduced['JobField'].value_counts()
    df_aliases = pd.DataFrame({
        'JobField': field_counts.index,
        'Count': field_counts.values,
    })
    df_aliases['FieldAlias'] = df_aliases['JobField']
    alias_table = df_aliases[['JobField','FieldAlias','Count']].sort_values('JobField')
    alias_table.to_csv(field_alias_fn, index=False)

## Save

In [28]:
# Stamp the output file with today's date. Month and day are deliberately not
# zero-padded, which matches the date format in the input file name (WIKI_FN).
now = datetime.now()
date = '-'.join(str(part) for part in (now.year, now.month, now.day))
ofn = f'data.jobcensus.rc.synthesized.{date}.csv'
# index=False: the original wiki row numbers are not written to the file.
df_reduced.to_csv(ofn, index=False)