-
Notifications
You must be signed in to change notification settings - Fork 0
/
train_puls_model.sh
executable file
·36 lines (23 loc) · 1.3 KB
/
train_puls_model.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
#! /bin/bash
#./run_feature_experiment 1+2+3 upper train_path test_path
feature_ids=1+2+3+4+5+6
train_path="/cs/taatto/home/hxiao/capitalization-recovery/data/puls-100k/train.txt"
test_path="/cs/taatto/home/hxiao/capitalization-recovery/data/puls-100k/test.txt"
result_dir="/cs/taatto/home/hxiao/capitalization-recovery/result/puls-100k"
suffix=''
if [ ! -d $result_dir ]; then
mkdir -p $result_dir
fi
cd ~/code/capitalization_train/
cat $train_path | python crfsuite-0.12/example/chunking.py $feature_ids > $result_dir/train.crfsuite-${suffix}.txt
# cat $test_path | python crfsuite-0.12/example/chunking.py $feature_ids > $result_dir/test.crfsuite.txt
# ./crfsuite-0.12/bin/crfsuite learn -e2 ${result_dir}/train.crfsuite.txt ${result_dir}/test.crfsuite.txt > ${result_dir}/result-dev.txt
## The following line is used for cross validation
# ./crfsuite-0.12/bin/crfsuite learn -g10 -x -l $result_dir/train.crfsuite-${suffix}.txt > $result_dir/cross_validation-${suffix}.txt
## You might need to use all the data for model training after cross validation
## The following does that
./crfsuite-0.12/bin/crfsuite learn -m $result_dir/model-${suffix} $result_dir/train.crfsuite-${suffix}.txt
# remove train data to save space
# rm $result_dir/train.crfsuite.txt
# rm $result_dir/model
# rm $result_dir/test.crfsuite.txt