-
Notifications
You must be signed in to change notification settings - Fork 1
/
ablation.sh
162 lines (145 loc) · 15.1 KB
/
ablation.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
# default ----------
# Baseline configuration: --neutral-thresh 0.2, --max-samples 1000,
# --sample-size 32 32, --vshift 10.
# For each training set: generate samples, train a model on them, then
# evaluate that model (cdip-trained model on D1 and D2, isri-ocr-trained
# model on cdip).
# The sample directories are intentionally left in place here (this section
# has no rm -rf step).
# If sample generation or training fails, the remaining steps for that
# training set are skipped so no evaluation runs against a model that was
# not (re)built by this run.
for train_set in cdip isri-ocr; do
  model_id="${train_set}_0.2_1000_32x32"
  samples_dir=~/samples_v3/"${model_id}"

  if ! python generate_samples.py --neutral-thresh 0.2 --dataset "${train_set}" \
    --max-samples 1000 --sample-size 32 32 --save-dir "${samples_dir}"; then
    printf 'ablation.sh: sample generation failed for %s; skipping\n' "${model_id}" >&2
    continue
  fi

  if ! python train.py --model-id "${model_id}" --samples-dir "${samples_dir}"; then
    printf 'ablation.sh: training failed for %s; skipping evaluation\n' "${model_id}" >&2
    continue
  fi

  # The evaluation datasets depend on which set the model was trained on.
  case "${train_set}" in
    cdip) eval_sets='D1 D2' ;;
    *) eval_sets='cdip' ;;
  esac

  # eval_sets is a space-separated list; word splitting is intentional.
  # shellcheck disable=SC2086
  for eval_set in ${eval_sets}; do
    python -m ablation.run --dataset "${eval_set}" --model-id "${model_id}" \
      --results-id "${eval_set}_0.2_1000_32x32_10" \
      --input-size 3000 32 --vshift 10 --max-ndocs 5
  done
done
# others ----------
# neutral_thresh=0.1 and neutral_thresh=0.3
# For each threshold and each training set: generate samples, train a model,
# delete the samples, then evaluate the model (cdip-trained model on D1 and
# D2, isri-ocr-trained model on cdip). All other parameters stay at
# --max-samples 1000, --sample-size 32 32, --vshift 10.
# The samples are only deleted after training succeeded, so a failed training
# run can be retried without regenerating them, and a failed step skips the
# evaluations that would otherwise run against a model this run did not build.
for neutral_thresh in 0.1 0.3; do
  for train_set in cdip isri-ocr; do
    model_id="${train_set}_${neutral_thresh}_1000_32x32"
    samples_dir=~/samples_v3/"${model_id}"

    if ! python generate_samples.py --neutral-thresh "${neutral_thresh}" \
      --dataset "${train_set}" --max-samples 1000 --sample-size 32 32 \
      --save-dir "${samples_dir}"; then
      printf 'ablation.sh: sample generation failed for %s; skipping\n' "${model_id}" >&2
      continue
    fi

    if ! python train.py --model-id "${model_id}" --samples-dir "${samples_dir}"; then
      printf 'ablation.sh: training failed for %s; samples kept in %s\n' \
        "${model_id}" "${samples_dir}" >&2
      continue
    fi

    # ${var:?} aborts instead of expanding to an empty path if the variable
    # is ever unset or empty.
    rm -rf -- "${samples_dir:?}"

    # The evaluation datasets depend on which set the model was trained on.
    case "${train_set}" in
      cdip) eval_sets='D1 D2' ;;
      *) eval_sets='cdip' ;;
    esac

    # eval_sets is a space-separated list; word splitting is intentional.
    # shellcheck disable=SC2086
    for eval_set in ${eval_sets}; do
      python -m ablation.run --dataset "${eval_set}" --model-id "${model_id}" \
        --results-id "${eval_set}_${neutral_thresh}_1000_32x32_10" \
        --input-size 3000 32 --vshift 10 --max-ndocs 5
    done
  done
done
# max_samples=500 and max_samples=1500
# For each sample budget and each training set: generate samples, train a
# model, delete the samples, then evaluate the model (cdip-trained model on
# D1 and D2, isri-ocr-trained model on cdip). All other parameters stay at
# --neutral-thresh 0.2, --sample-size 32 32, --vshift 10.
# The samples are only deleted after training succeeded, so a failed training
# run can be retried without regenerating them, and a failed step skips the
# evaluations that would otherwise run against a model this run did not build.
for max_samples in 500 1500; do
  for train_set in cdip isri-ocr; do
    model_id="${train_set}_0.2_${max_samples}_32x32"
    samples_dir=~/samples_v3/"${model_id}"

    if ! python generate_samples.py --neutral-thresh 0.2 \
      --dataset "${train_set}" --max-samples "${max_samples}" \
      --sample-size 32 32 --save-dir "${samples_dir}"; then
      printf 'ablation.sh: sample generation failed for %s; skipping\n' "${model_id}" >&2
      continue
    fi

    if ! python train.py --model-id "${model_id}" --samples-dir "${samples_dir}"; then
      printf 'ablation.sh: training failed for %s; samples kept in %s\n' \
        "${model_id}" "${samples_dir}" >&2
      continue
    fi

    # ${var:?} aborts instead of expanding to an empty path if the variable
    # is ever unset or empty.
    rm -rf -- "${samples_dir:?}"

    # The evaluation datasets depend on which set the model was trained on.
    case "${train_set}" in
      cdip) eval_sets='D1 D2' ;;
      *) eval_sets='cdip' ;;
    esac

    # eval_sets is a space-separated list; word splitting is intentional.
    # shellcheck disable=SC2086
    for eval_set in ${eval_sets}; do
      python -m ablation.run --dataset "${eval_set}" --model-id "${model_id}" \
        --results-id "${eval_set}_0.2_${max_samples}_32x32_10" \
        --input-size 3000 32 --vshift 10 --max-ndocs 5
    done
  done
done
# sample_size=AxB for A, B in {32, 48, 64}, except 32x32
# (32x32 is the default configuration and is run in the "default" section.)
# For each size and each training set: generate samples, train a model,
# delete the samples, then evaluate the model (cdip-trained model on D1 and
# D2, isri-ocr-trained model on cdip). All other parameters stay at
# --neutral-thresh 0.2, --max-samples 1000, --vshift 10.
# The second value passed to --input-size is the second sample dimension.
# The samples are only deleted after training succeeded, so a failed training
# run can be retried without regenerating them, and a failed step skips the
# evaluations that would otherwise run against a model this run did not build.
for dim_a in 32 48 64; do
  for dim_b in 32 48 64; do
    if [ "${dim_a}" = 32 ] && [ "${dim_b}" = 32 ]; then
      continue
    fi
    size_tag="${dim_a}x${dim_b}"

    for train_set in cdip isri-ocr; do
      model_id="${train_set}_0.2_1000_${size_tag}"
      samples_dir=~/samples_v3/"${model_id}"

      if ! python generate_samples.py --neutral-thresh 0.2 \
        --dataset "${train_set}" --max-samples 1000 \
        --sample-size "${dim_a}" "${dim_b}" --save-dir "${samples_dir}"; then
        printf 'ablation.sh: sample generation failed for %s; skipping\n' "${model_id}" >&2
        continue
      fi

      if ! python train.py --model-id "${model_id}" --samples-dir "${samples_dir}"; then
        printf 'ablation.sh: training failed for %s; samples kept in %s\n' \
          "${model_id}" "${samples_dir}" >&2
        continue
      fi

      # ${var:?} aborts instead of expanding to an empty path if the variable
      # is ever unset or empty.
      rm -rf -- "${samples_dir:?}"

      # The evaluation datasets depend on which set the model was trained on.
      case "${train_set}" in
        cdip) eval_sets='D1 D2' ;;
        *) eval_sets='cdip' ;;
      esac

      # eval_sets is a space-separated list; word splitting is intentional.
      # shellcheck disable=SC2086
      for eval_set in ${eval_sets}; do
        python -m ablation.run --dataset "${eval_set}" --model-id "${model_id}" \
          --results-id "${eval_set}_0.2_1000_${size_tag}_10" \
          --input-size 3000 "${dim_b}" --vshift 10 --max-ndocs 5
      done
    done
  done
done
# vshift=0, 5, 15, 20
# Evaluation-only sweep: no samples are generated and nothing is trained here.
# Each run uses the 0.2_1000_32x32 model ids (cdip-trained for D1 and D2,
# isri-ocr-trained for cdip) and only varies --vshift, which is also the
# trailing component of the results id.
for shift in 0 5 15 20; do
  for target in D1 D2 cdip; do
    case "${target}" in
      cdip) model='isri-ocr_0.2_1000_32x32' ;;
      *) model='cdip_0.2_1000_32x32' ;;
    esac
    python -m ablation.run \
      --dataset "${target}" \
      --model-id "${model}" \
      --results-id "${target}_0.2_1000_32x32_${shift}" \
      --input-size 3000 32 \
      --vshift "${shift}" \
      --max-ndocs 5
  done
done