-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrun.py
More file actions
93 lines (77 loc) · 3.41 KB
/
run.py
File metadata and controls
93 lines (77 loc) · 3.41 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
from argparse import ArgumentParser
import os, shutil, torch, sys
import torch.distributed as dist
from separ import Parser, DEP_PARSERS, CON_PARSERS, SDP_PARSERS, TAGGERS
from separ.utils import Config, set_seed, filename, is_distributed
PARSERS = {_parser.NAME: _parser for _parser in DEP_PARSERS + SDP_PARSERS + CON_PARSERS + TAGGERS}
def setup():
device = int(os.environ['LOCAL_RANK'])
torch.cuda.set_device(device)
dist.init_process_group("nccl")
return device
def cleanup():
dist.destroy_process_group()
def build_parser(args, builder) -> Parser:
# load configuration
if args.conf:
conf = Config.from_ini(args.conf)
conf.update(vars(args))
else:
conf = None
if args.load:
try:
parser = builder.load(args.load, args.device)
return parser, conf
except:
pass
assert os.path.exists(args.conf), f'Configuration file does not exist: {args.conf}'
os.makedirs(args.output_folder, exist_ok=True)
shutil.copyfile(args.conf, f'{args.output_folder}/{filename(args.conf)}')
parser = builder.build(**conf, data=args.train)
return parser, conf
def run(parser, conf, args):
if args.mode == 'train':
conf['train_conf'].update(vars(args))
parser.train(**conf['train_conf'])
elif args.mode == 'eval':
parser.evaluate(args.input, **vars(args))
elif args.mode == 'predict':
parser.predict(args.input, **vars(args))
def add_run_args(argparser: ArgumentParser) -> ArgumentParser:
subparser = argparser.add_subparsers(title='Run mode', dest='mode')
train = subparser.add_parser('train')
evaluate = subparser.add_parser('eval')
predict = subparser.add_parser('predict')
# train parser
train.add_argument('--train', type=str, help='Path to train set')
train.add_argument('--dev', type=str, help='Path to dev set')
train.add_argument('--test', type=str, nargs='*', help='Path to test set')
train.add_argument('-o', '--output-folder', type=str, help='Folder to store training results')
train.add_argument('--batch-size', type=int, help='Training batch size')
train.add_argument('--run-name', type=str, default=None, help='Running name for wandb')
# eval parser
evaluate.add_argument('input', type=str, help='Evaluation dataset')
evaluate.add_argument('--output', type=str, help='Output folder to store metric')
evaluate.add_argument('--batch-size', type=int, default=500, help='Inference batch size')
# predict parser
predict.add_argument('input', type=str, help='Evaluation dataset')
predict.add_argument('output', type=str, help='Output dataset')
predict.add_argument('--batch-size', type=int, default=500, help='Inference batch size')
return argparser
def build_argparser(name: str) -> ArgumentParser:
argparser = ArgumentParser(description='Syntactic Parser')
argparser = Parser.add_arguments(argparser)
argparser = PARSERS[name].add_arguments(argparser)
argparser = add_run_args(argparser)
return argparser
if __name__ == '__main__':
_, name, *args = sys.argv
argparser = build_argparser(name)
args = argparser.parse_args(args)
set_seed(args.seed)
if is_distributed():
args.device = setup()
run(*build_parser(args, PARSERS[name]), args)
cleanup()
else:
run(*build_parser(args, PARSERS[name]), args)