-
Notifications
You must be signed in to change notification settings - Fork 3
/
utils.py
43 lines (40 loc) · 6.32 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
import torch
# Lookup table from edge-label name to its integer id. Ids are contiguous,
# starting at 0, and follow the insertion order below.
# NOTE(review): the first six entries look like relation labels and the rest
# like argument-role names -- confirm against the code that consumes this map.
EDGE_LABELS = {
    "EQUAL": 0,
    "INCLUDED": 1,
    "INCLUDE": 2,
    "BEFORE": 3,
    "AFTER": 4,
    "SELF_LOOP": 5,
    "Agent": 6,
    "Beneficiary": 7,
    "Destination": 8,
    "Target": 9,
    "Attacker": 10,
    "Crime": 11,
    "Sentence": 12,
    "Entity": 13,
    "Org": 14,
    "Time-Before": 15,
    "Buyer": 16,
    "Seller": 17,
    "Place": 18,
    "Time-At-End": 19,
    "Time-At-Beginning": 20,
    "Artifact": 21,
    "Time-Within": 22,
    "Adjudicator": 23,
    "Vehicle": 24,
    "Position": 25,
    "Prosecutor": 26,
    "Money": 27,
    "Time-Starting": 28,
    "Price": 29,
    "Plaintiff": 30,
    "Victim": 31,
    "Time-Holds": 32,
    "Time-After": 33,
    "Recipient": 34,
    "Origin": 35,
    "Person": 36,
    "Instrument": 37,
    "Defendant": 38,
    "Time-Ending": 39,
    "Giver": 40,
}
# Document ids that make up the base training split.
# Every id appears exactly once, so a per-document loop over this list visits
# each training document a single time.
# NOTE(review): the original list named 'AGGRESSIVEVOICEDAILY_20041116.1347'
# twice; the second occurrence was dropped. If that entry was a typo for a
# different document id, add the intended id here -- TODO confirm against the
# dataset manifest.
TRAIN_DOCS = [
    'CNN_CF_20030303.1900.02',
    'CNN_IP_20030405.1600.01-1',
    'CNN_IP_20030409.1600.02',
    'CNNHL_ENG_20030304_142751.10',
    'CNN_ENG_20030328_150609.10',
    'CNN_ENG_20030424_070008.15',
    'AGGRESSIVEVOICEDAILY_20041116.1347',
    'FLOPPINGACES_20050217.1237.014',
    'TTRACY_20050223.1049',
    'AGGRESSIVEVOICEDAILY_20041101.1144',
    'AGGRESSIVEVOICEDAILY_20041101.1806',
    'AGGRESSIVEVOICEDAILY_20041201.2313',
    'AGGRESSIVEVOICEDAILY_20041203.1959',
    'AGGRESSIVEVOICEDAILY_20041208.2133',
    'AGGRESSIVEVOICEDAILY_20041215.2302',
    'AGGRESSIVEVOICEDAILY_20041218.1004',
    'AGGRESSIVEVOICEDAILY_20041223.1449',
    'AGGRESSIVEVOICEDAILY_20041226.1712',
    'AGGRESSIVEVOICEDAILY_20050106.1310',
    'AFP_ENG_20030304.0250',
    'AFP_ENG_20030314.0238',
    'AFP_ENG_20030327.0022',
    'AFP_ENG_20030401.0476',
    'AFP_ENG_20030413.0098',
    'AFP_ENG_20030415.0734',
    'AFP_ENG_20030417.0764',
    'AFP_ENG_20030427.0118',
    'AFP_ENG_20030429.0007',
    'AFP_ENG_20030430.0075',
    'AFP_ENG_20030502.0614',
    'AFP_ENG_20030508.0357',
    'AFP_ENG_20030519.0049',
    'AFP_ENG_20030522.0878',
    'AFP_ENG_20030527.0616',
    'AFP_ENG_20030528.0561',
    'AFP_ENG_20030607.0030',
    'AFP_ENG_20030625.0057',
    'APW_ENG_20030304.0555',
    'APW_ENG_20030306.0191',
    'APW_ENG_20030308.0314',
    'APW_ENG_20030318.0689',
    'APW_ENG_20030324.0768',
    'AFP_ENG_20030323.0020',
    'AFP_ENG_20030330.0211',
    'APW_ENG_20030326.0190',
    'APW_ENG_20030403.0862',
    'rec.games.chess.politics_20041216.1047',
]
# Document ids that make up the base development (validation) split.
DEV_DOCS = [
    "CNN_IP_20030329.1600.00-2",
    "CNNHL_ENG_20030424_123502.25",
    "CNN_ENG_20030620_085840.7",
    "FLOPPINGACES_20041117.2002.024",
    "AGGRESSIVEVOICEDAILY_20050208.1142",
    "AGGRESSIVEVOICEDAILY_20050213.2123",
    "AGGRESSIVEVOICEDAILY_20050224.1207",
    "AGGRESSIVEVOICEDAILY_20050224.2252",
    "AFP_ENG_20030305.0918",
    "AFP_ENG_20030319.0879",
    "AFP_ENG_20030417.0004",
    "AFP_ENG_20030418.0556",
    "AFP_ENG_20030504.0248",
    "AFP_ENG_20030509.0345",
    "AFP_ENG_20030530.0132",
    "AFP_ENG_20030616.0715",
    "APW_ENG_20030310.0719",
    "APW_ENG_20030319.0545",
    "APW_ENG_20030327.0376",
]
# Document ids that make up the base test split.
TEST_DOCS = [
    "CNN_IP_20030402.1600.00-1",
    "CNNHL_ENG_20030513_220910.32",
    "CNN_ENG_20030304_173120.16",
    "CNN_ENG_20030512_170454.13",
    "FLOPPINGACES_20050203.1953.038",
    "AGGRESSIVEVOICEDAILY_20050107.2012",
    "AGGRESSIVEVOICEDAILY_20050113.1400",
    "AGGRESSIVEVOICEDAILY_20050116.2149",
    "AGGRESSIVEVOICEDAILY_20050124.1354",
    "AGGRESSIVEVOICEDAILY_20050203.1356",
    "AGGRESSIVEVOICEDAILY_20050205.1954",
    "AFP_ENG_20030311.0491",
    "AFP_ENG_20030320.0722",
    "AFP_ENG_20030327.0224",
    "AFP_ENG_20030417.0307",
    "AFP_ENG_20030425.0408",
    "AFP_ENG_20030428.0720",
    "AFP_ENG_20030508.0118",
    "AFP_ENG_20030514.0706",
    "AFP_ENG_20030519.0372",
    "AFP_ENG_20030601.0262",
    "AFP_ENG_20030617.0846",
    "AFP_ENG_20030630.0271",
    "APW_ENG_20030311.0775",
    "APW_ENG_20030322.0119",
    "APW_ENG_20030325.0786",
    "APW_ENG_20030331.0410",
]
# Supplementary document ids for the training split.
added_train = [
    "APW_ENG_20030519.0367",
    "APW_ENG_20030424.0698",
    "CNNHL_ENG_20030604_230238.5",
    "APW_ENG_20030610.0010",
    "CNNHL_ENG_20030505_220734.25",
    "CNNHL_ENG_20030526_221156.39",
    "CNN_ENG_20030401_233449.5",
    "CNN_ENG_20030403_090032.1",
    "APW_ENG_20030416.0581",
    "APW_ENG_20030502.0686",
    "CNNHL_ENG_20030425_183518.12",
    "CNN_ENG_20030327_163556.20",
    "CNNHL_ENG_20030624_230338.34",
    "APW_ENG_20030415.0742",
    "APW_ENG_20030502.0470",
    "APW_ENG_20030417.0555",
    "CNNHL_ENG_20030625_230351.4",
    "CNNHL_ENG_20030416_193742.7",
    "APW_ENG_20030520.0757",
    "CNNHL_ENG_20030523_221118.14",
    "CNN_ENG_20030305_170125.1",
    "APW_ENG_20030411.0304",
    "CNN_ENG_20030403_060032.0",
    "CNNHL_ENG_20030416_133739.13",
    "APW_ENG_20030419.0358",
    "CNNHL_ENG_20030625_193346.7",
    "CNN_ENG_20030402_190500.11",
    "CNN_ENG_20030320_153434.7",
    "CNN_ENG_20030325_220534.6",
    "CNN_ENG_20030318_140851.8",
    "CNNHL_ENG_20030428_123600.14",
    "APW_ENG_20030619.0383",
    "CNNHL_ENG_20030603_230307.3",
    "CNNHL_ENG_20030429_220618.15",
    "APW_ENG_20030412.0531",
    "CNNHL_ENG_20030416_133739.9",
    "CNNHL_ENG_20030416_193742.26",
    "APW_ENG_20030422.0469",
    "APW_ENG_20030407.0030",
    "CNNHL_ENG_20030519_124020.23",
    "CNN_ENG_20030325_150531.10",
    "APW_ENG_20030424.0532",
    "APW_ENG_20030610.0554",
    "CNN_ENG_20030403_080032.9",
]
# Supplementary document ids for the development split.
added_dev = [
    "APW_ENG_20030422.0485",
    "CNNHL_ENG_20030312_150218.13",
    "APW_ENG_20030409.0013",
    "CNNHL_ENG_20030402_193443.5",
    "APW_ENG_20030508.0772",
    "CNNHL_ENG_20030331_193419.9",
    "CNNHL_ENG_20030402_133449.22",
    "CNNHL_ENG_20030610_230438.14",
    "APW_ENG_20030513.0139",
    "APW_ENG_20030404.0439",
    "APW_ENG_20030408.0090",
    "CNNHL_ENG_20030403_133453.21",
    "CNN_ENG_20030331_123648.4",
    "APW_ENG_20030527.0232",
    "CNNHL_ENG_20030403_193455.30",
    "CNNHL_ENG_20030610_133347.6",
    "CNNHL_ENG_20030609_133335.37",
    "CNN_ENG_20030306_070606.18",
    "CNN_ENG_20030329_170349.7",
    "CNNHL_ENG_20030513_183907.5",
]
# Supplementary document ids for the test split.
added_test = [
    "APW_ENG_20030510.0228",
    "CNN_ENG_20030306_083604.6",
    "CNN_ENG_20030331_193655.14",
    "CNNHL_ENG_20030618_230303.36",
    "CNNHL_ENG_20030618_230303.6",
    "CNN_ENG_20030401_073033.14",
    "APW_ENG_20030520.0081",
    "APW_ENG_20030406.0191",
    "APW_ENG_20030418.0084",
    "CNNHL_ENG_20030611_133445.24",
    "CNNHL_ENG_20030411_230640.38",
    "CNN_ENG_20030312_083725.3",
    "CNNHL_ENG_20030616_230155.7",
    "CNNHL_ENG_20030513_220910.11",
    "APW_ENG_20030519.0548",
    "APW_ENG_20030410.0906",
    "CNNHL_ENG_20030410_193626.13",
    "APW_ENG_20030423.0079",
    "CNNHL_ENG_20030624_133331.33",
    "CNNHL_ENG_20030415_193729.5",
    "CNN_ENG_20030312_223733.14",
    "CNNHL_ENG_20030616_230155.28",
    "APW_ENG_20030602.0037",
    "APW_ENG_20030603.0303",
]
# Append the supplementary ids to each split in place, so the module-level
# split lists end up holding both the base and the added documents.
TRAIN_DOCS.extend(added_train)
DEV_DOCS.extend(added_dev)
TEST_DOCS.extend(added_test)