-
Notifications
You must be signed in to change notification settings - Fork 21
/
Copy pathdeepblast-evaluate
61 lines (53 loc) · 2.04 KB
/
deepblast-evaluate
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
#!/usr/bin/env python3
import argparse
import os
import pandas as pd
import torch
from pytorch_lightning import Trainer
from transformers import T5EncoderModel, T5Tokenizer
from deepblast.trainer import DeepBLAST
def main(args):
    """Evaluate a DeepBLAST checkpoint and write the test results to CSV.

    Parameters
    ----------
    args : argparse.Namespace
        Parsed command-line options. The attributes read here are
        ``pretrain_path``, ``load_from_checkpoint``, ``alignment_mode``,
        ``accelerator``, ``epochs``, ``gpus``, ``nodes``, ``backend``,
        ``precision``, ``test_pairs`` and ``output_directory``.

    Notes
    -----
    Results are written to
    ``{output_directory}/{basename(test_pairs)}-results.csv``. The parent
    directory of that file is created if it does not exist yet.
    """
    print('args', args)

    # Resolve the destination before any heavy work and make sure its
    # directory exists, so a missing output directory cannot make the script
    # fail only after the whole evaluation has already run.
    fname = os.path.basename(args.test_pairs)
    results_path = f'{args.output_directory}/{fname}-results.csv'
    os.makedirs(os.path.dirname(results_path), exist_ok=True)

    # The tokenizer and the language model are loaded from the same
    # pretrained path and handed to the checkpoint loader.
    tokenizer = T5Tokenizer.from_pretrained(
        args.pretrain_path, do_lower_case=False)
    lm = T5EncoderModel.from_pretrained(args.pretrain_path)
    model = DeepBLAST.load_from_checkpoint(
        args.load_from_checkpoint, lm=lm, tokenizer=tokenizer,
        alignment_mode=args.alignment_mode)
    if args.accelerator == 'gpu':
        model = model.cuda()

    trainer = Trainer(
        max_epochs=args.epochs,
        gpus=args.gpus,
        num_nodes=args.nodes,
        distributed_backend=args.backend,
        precision=args.precision,
        val_check_interval=0.25,
        fast_dev_run=False,
    )

    # NOTE(review): the original author flagged the test function as behaving
    # unexpectedly; the cause is not documented here. The conversion below
    # assumes each returned entry is accepted by pd.DataFrame - confirm.
    test_res = trainer.test(model)
    frames = [pd.DataFrame(res) for res in test_res]
    results = pd.concat(frames, axis=0)
    results.to_csv(results_path)
if __name__ == '__main__':
    # Script entry point: declare the evaluation options, let DeepBLAST add
    # its own options, then parse the command line and run the evaluation.
    # NOTE(review): help is disabled on this parser, presumably because
    # add_model_specific_args supplies its own -h/--help - confirm.
    parser = argparse.ArgumentParser(add_help=False)

    # (flag, add_argument keyword arguments), in registration order.
    cli_options = (
        ('--accelerator', {'type': str, 'default': 'cpu'}),
        ('--gpus', {'type': int, 'default': None}),
        ('--num-workers', {'type': int, 'default': 1}),
        ('--nodes', {'type': int, 'default': 1}),
        ('--load-from-checkpoint', {'type': str, 'default': None}),
        ('--pretrain-path', {'type': str, 'default': None,
                             'help': "Path to pretrained model."}),
        ('--precision', {'type': int, 'default': 32}),
        # options include ddp_cpu, dp, ddp
        ('--backend', {'type': str, 'default': None}),
    )
    for flag, spec in cli_options:
        parser.add_argument(flag, **spec)

    parser = DeepBLAST.add_model_specific_args(parser)
    hparams = parser.parse_args()
    main(hparams)