-
Notifications
You must be signed in to change notification settings - Fork 1
/
test_result.txt
100 lines (88 loc) · 5.72 KB
/
test_result.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
1.
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib25_none
{"correct_num": 2012, "instance_num": 3325, "accuracy": 50.61, "total_accuracy": 60.51}
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib25_t1
{"correct_num": 2640, "instance_num": 3325, "accuracy": 75.24, "total_accuracy": 79.4,
"correct_num_expert": 2689, "instance_num_expert": 3325, "accuracy_expert": 76.75, "total_accuracy_expert": 80.87}
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib25_t2
{"correct_num": 2451, "instance_num": 3325, "accuracy": 67.64, "total_accuracy": 73.71,
"correct_num_expert": 2749, "instance_num_expert": 3325, "accuracy_expert": 79.55, "total_accuracy_expert": 82.68}
2. learning rate 0.0005
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t1
{"correct_num": 2750, "instance_num": 3325, "accuracy": 78.08, "total_accuracy": 82.71,
"correct_num_expert": 2830, "instance_num_expert": 3325, "accuracy_expert": 80.39, "total_accuracy_expert": 85.11}
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t2
{"correct_num": 2625, "instance_num": 3325, "accuracy": 75.12, "total_accuracy": 78.95,
"correct_num_expert": 2785, "instance_num_expert": 3325, "accuracy_expert": 79.84, "total_accuracy_expert": 83.76}
3. learning rate 0.0001
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t1_2
{"correct_num": 2418, "instance_num": 3325, "accuracy": 69.34, "total_accuracy": 72.72,
"correct_num_expert": 2542, "instance_num_expert": 3325, "accuracy_expert": 72.07, "total_accuracy_expert": 76.45}
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t2_2
{"correct_num": 2282, "instance_num": 3325, "accuracy": 62.97, "total_accuracy": 68.63,
"correct_num_expert": 2456, "instance_num_expert": 3325, "accuracy_expert": 70.7, "total_accuracy_expert": 73.86}
4. learning rate 0.001
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t1_3
{"correct_num": 2811, "instance_num": 3325, "accuracy": 79.31, "total_accuracy": 84.54,
"correct_num_expert": 2875, "instance_num_expert": 3325, "accuracy_expert": 81.22, "total_accuracy_expert": 86.47}
tacred_supervised_li_fine_p10_bert_large_lora4_mk00_p10_bat2lib50_t2_3
{"correct_num": 2611, "instance_num": 3325, "accuracy": 73.87, "total_accuracy": 78.53,
"correct_num_expert": 2872, "instance_num_expert": 3325, "accuracy_expert": 81.74, "total_accuracy_expert": 86.38}
TACRED top-1 expert 50 * 50 (3 replications)
"accuracy": 79.31, "total_accuracy": 84.54
"accuracy": 77.46, "total_accuracy": 82.71
"accuracy": 78.45, "total_accuracy": 82.14
TACRED top-2 expert 50 * 50
"accuracy": 75.12, "total_accuracy": 78.95
TACRED EMR 50 * 50 (3 replications)
"accuracy": 78.82, "total_accuracy": 83.61
"accuracy": 77.33, "total_accuracy": 81.26
"accuracy": 78.53, "total_accuracy": 82.11
TACRED top-1 expert 25 * 50
"accuracy": 75.24, "total_accuracy": 79.40
TACRED top-2 expert 25 * 50
"accuracy": 67.64, "total_accuracy": 73.71
TACRED all expert 25 * 50
"accuracy": 50.61, "total_accuracy": 60.51
TACRED top-1 expert whole
"accuracy": 80.98, "total_accuracy": 86.71
TACRED all expert whole
"accuracy": 70.46, "total_accuracy": 78.71
BBN: ewc_e10_l1000, "accuracy": 9.79, "total_accuracy": 2.96
BBN: lwf_e10_l01, 'accuracy': 14.06, 'total_accuracy': 4.16, 0.01
BBN: lwf_e10_l001, 'accuracy': 10.99, 'total_accuracy': 3.26, 0.001
BBN: lwf_e10_l0d5, 'accuracy': 3.23, 'total_accuracy': 1.53
BBN: lwf_e10_l0d01, 'accuracy': 12.68, 'total_accuracy': 3.73
BBN: lwf_e10_l0d05, 'accuracy': 12.77, 'total_accuracy': 4.07
BBN: lwf_e10_l0d1, 'accuracy': 14.84, 'total_accuracy': 5.04
BBN: lwf_e5_l0d5, 'accuracy': 3.15, 'total_accuracy': 2.01
BBN: lwf_e5_l0d05, 'accuracy': 14.19, 'total_accuracy': 6.76
BBN: lwf_e5_l0d01, 'accuracy': 12.67, 'total_accuracy': 3.71
BBN: lwf_e5_l0d1, 'accuracy': 15.16, 'total_accuracy': 8.37
FewNERD: ewc_e5_l100, "accuracy": 10.07, "total_accuracy": 4.81
FewNERD: ewc_e5_l1000, 'accuracy': 21.44, 'total_accuracy': 12.67
FewNERD: ewc_e5_l5000, 'accuracy': 9.37, 'total_accuracy': 5.28
FewNERD: ewc_e5_l10000, "accuracy": 10.07, "total_accuracy": 4.81
FewNERD: lwf_e1_l10, "accuracy": 4.23, "total_accuracy": 4.16, 10.0
FewNERD: lwf_e3_l10, "accuracy": 2.48, "total_accuracy": 2.69, 10.0
FewNERD: lwf_e5_l10, "accuracy": 2.94, "total_accuracy": 4.04, 10.0
FewNERD: lwf_e5_l100, "accuracy": 2.21, "total_accuracy": 1.84, 100.0
FewNERD: lwf_e5_l0001, "accuracy": 17.56, "total_accuracy": 8.35, 0.0001
FewNERD: lwf_e5_l001, "accuracy": 17.76, "total_accuracy": 8.68, 0.01
FewNERD: lwf_e5_l01, "accuracy": 28.06, "total_accuracy": 16.9, 0.1
FewNERD: lwf_e5_l100, "accuracy": 2.2, "total_accuracy": 1.79, 100.0
FewNERD: lwf_e5_l10, "accuracy": 2.95, "total_accuracy": 4.07, 10.0
FewNERD: lwf_e5_l1, "accuracy": 6.3, "total_accuracy": 5.17, 1.0
OntoNotes: lwf_e5_l01, 'accuracy': 17.25, 'total_accuracy': 10.98, 0.01
OntoNotes: lwf_e5_l001, 'accuracy': 13.04, 'total_accuracy': 8.13, 0.001
OntoNotes: lwf_e5_l0d5, 'accuracy': 6.89, 'total_accuracy': 8.34
OntoNotes: lwf_e5_l0d1, 'accuracy': 24.88, 'total_accuracy': 19.13
OntoNotes: lwf_e5_l0d05, 'accuracy': 20.86, 'total_accuracy': 14.8
OntoNotes: lwf_e5_l0d01, 'accuracy': 17.25, 'total_accuracy': 10.98
FewRel: ewc_e5_l1000, 'accuracy': 12.7, 'total_accuracy': 12.7
FewRel: ewc_e5_l5000, 'accuracy': 18.23, 'total_accuracy': 18.23
FewRel: lwf_e5_l00001, "accuracy": 10.61, "total_accuracy": 10.61, 1.0e-05
FewRel: lwf_e5_l0001, "accuracy": 13.8, "total_accuracy": 13.8, 0.0001
FewRel: lwf_e5_l001, "accuracy": 13.23, "total_accuracy": 13.23, 0.001
FewRel: lwf_e5_l01, "accuracy": 19.8, "total_accuracy": 19.8, 0.01
python train_cycle.py --dataset_name ontonotes --use_selector 0 --teacher_forcing --batch_limit_policy 0 --cycle_suffix bat2liwhole_lwf_e5_l0d01 --method_type linear --continual_method lwf --seed 100 --device cuda:4 --start 1