# Export the Word Lists from Roorda & Dyk to a Master JSON File

See the [Roorda&Dyk valency corrections notebook](https://shebanq.ancient-data.org/shebanq/static/docs/tools/valence/corr_enrich.html) for the source.

## Updates:
- √ 15.01.17: Added some new categories needed by the CKB_valency notebook. See [Additions](#Additions:).

In [1]:
import json

# Lexemes categorised as 'place'. The literal is a whitespace-separated list,
# so every entry MUST be separated from its neighbours by whitespace: a missing
# space silently fuses two lexemes into one bogus entry (this previously
# happened with '>XR/' and '<BR/').
# NOTE(review): 'CM' carries no trailing '/' unlike the other entries --
# presumably intentional; confirm against the source list.
locatives = set('''
                >RY/ >YL/ >XR/ <BR/ <BRH/ <BWR/ <C==/ <JR/ <L=/ 
                <LJ=/ <LJH/ <LJL/ <MD=/ <MDH/ <MH/ <MQ/ <MQ===/ 
                <QB/ BJN/ BJT/ CM CMJM/ CMC/ C<R/ DRK/ FDH/ HR/
                JM/ JRDN/ JRWCLM/ JFR>L/ MDBR/ MW<D/ MWL/ MZBX/ 
                MYRJM/ MQWM/ MR>CWT/ MSB/ MSBH/ MVH==/ QDM/
                SBJB/ TJMN/ TXT/ TXWT/ YPWN/
                '''.strip().split())
# Lexemes categorised as 'agent'. The literal below is a whitespace-separated
# list; str.split() with no argument discards leading/trailing whitespace and
# line breaks, so the layout of the literal is free-form.
agentives = set(
    '''
    >B/ >CH/ >DM/ >DRGZR/ >DWN/ >JC/ >J=/ >KR/ >LJL/ >LMN=/ >LMNH/ >LMNJ/
    >LWH/ >LWP/ >M/ >MH/ >MN==/ >MWN=/ >NC/ >NWC/ >PH/ >PRX/ >SJR/ >SJR=/
    >SP/ >X/ >XCDRPN/ >XWH/ >XWT/
    <BDH=/ <CWQ/ <D=/ <DH=/ <LMH/ <LWMJM/ <M/ <MD/ <MJT/ <QR=/ <R/ <WJL/
    <WL/ <WL==/ <WLL/ <WLL=/ <YRH/
    B<L/ B<LH/ BKJRH/ BKR/ BN/ BR/ BR===/ BT/ BTWLH/ BWQR/ BXRJM/ BXWN/
    BXWR/
    CD==/ CDH/ CGL/ CKN/ CLCJM/ CLJC=/ CMRH=/ CPXH/ CW<R/ CWRR/
    DJG/ DWD/ DWDH/ DWG/ DWR/
    F<JR=/ FB/ FHD/ FR/ FRH/ FRJD/ FVN/
    GBJRH/ GBR/ GBR=/ GBRT/ GLB/ GNB/ GR/ GW==/ GWJ/ GZBR/
    HDBR/
    J<RH/ JBM/ JBMH/ JD<NJ/ JDDWT/ JLD/ JLDH/ JLJD/ JRJB/ JSWR/ JTWM/
    JWYR/ JYRJM/
    KCP=/ KHN/ KLH/ KMR/ KN<NJ=/ KNT/ KRM=/ KRWB/ KRWZ/
    L>M/ LHQH/ LMD/ LXNH/
    M<RMJM/ M>WRH/ MCBR/ MCJX/ MCM<T/ MCMR/ MCPXH/ MCQLT/ MD<=/ MD<T/ MG/
    MJNQT/ MKR=/ ML>K/ MLK/ MLKH/ MLKT/ MLX=/ MLYR/ MMZR/ MNZRJM/ MPLYT/
    MYRJ/ MPY=/ MQHL/ MQY<H/ MR</ MR>/ MSGR=/ MT/ MWRH/ MYBH=/
    N<R/ N<R=/ N<RH/ N<RWT/ N<WRJM/ NBJ>/ NBJ>H/ NCJN/ NFJ>/ NGJD/ NJN/
    NKD/ NKR/ NPC/ NPJLJM/ NQD/ NSJK/ NTJN/
    PLGC/ PLJL/ PLJV/ PLJV=/ PQJD/ PR<H/ PRC/ PRJY/ PRJY=/ PRTMJM/ PRZWN/
    PSJL/ PSL/ PVR/ PVRH/ PXH/ PXR/
    QBYH/ QCRJM/ QCT=/ QHL/ QHLH/ QHLT/ QJM/ QYJN/
    R<H=/ R<H==/ R<JH/ R<=/ R<WT/ R>H/ RB</ RB=/ RB==/ RBRBNJN/ RGMH/ RHB/
    RKB=/ RKJL/ RMH/ RQX==/
    SBL/ SPR=/ SRJS/ SRK/ SRNJM/
    T<RWBWT/ TLMJD/ TLT=/ TPTJ/ TR<=/ TRCT>/ TRTN/ TWCB/ TWL<H/ TWLDWT/
    TWTX/
    VBX/ VBX=/ VBXH=/ VPSR/ VPXJM/
    WLD/
    XBL==/ XBL======/ XBR/ XBR=/ XBR==/ XBRH/ XBRT=/ XJ=/ XLC/ XM=/ XMWT/
    XMWY=/ XNJK/ XR=/ XRC/ XRC====/ XRP=/ XRVM/ XTN/ XTP/ XZH=/
    Y<JRH/ Y>Y>JM/ YJ/ YJD==/ YJR==/ YR=/ YRH=/
    ZKWR/ ZMR=/ ZR</
    '''.split()
)

# Category label -> set of lexemes carrying that label.
categoryMap = {'place': locatives, 'agent': agentives}

# Invert the mapping into lexeme -> {'category': label}. Categories are
# visited in categoryMap order, so a lexeme present in more than one set
# ends up with the label of the last category that contains it.
rdCategories = {
    lexeme: {'category': label}
    for label, members in categoryMap.items()
    for lexeme in members
}

## Additions:

In [5]:
# CAUTION: These additions are for a special project only. The categories may
# not be applicable for certain passages!

# Register the extra lexemes as agents; an existing entry for the same lexeme
# is overwritten. Each lexeme gets its own fresh record dict.
rdCategories.update({
    extraLexeme: {'category': 'agent'}
    for extraLexeme in ('VM>/', 'ZKR=/', 'BHMH/')
})

In [6]:
# Serialise the lexeme -> category mapping and write it to the master JSON
# file in the current working directory (an existing file is overwritten).
serialized = json.dumps(rdCategories)
with open('RoordaDykCategories.json', 'w') as outfile:
    outfile.write(serialized)