-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtrain.py
78 lines (68 loc) · 3.07 KB
/
train.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
import torch
import json
import pickle
import opennre
from opennre import encoder, model, framework
import argparse
import logging
# Emit INFO-level messages from this script on the root logger.
logging.basicConfig(level=logging.INFO)

# Silence unimportant log messages: these transformers loggers are raised to
# WARNING so that only warnings and errors from them are shown.
for logger_name in (
    'transformers.configuration_utils',
    'transformers.modeling_utils',
    'transformers.tokenization_utils_base',
):
    logging.getLogger(logger_name).setLevel(logging.WARNING)
# Command-line options for a training run (wiki80 and tacred datasets).
# Each entry pairs an option's flags with its add_argument settings; entries
# are registered in the order listed, so the --help layout is unchanged.
parser = argparse.ArgumentParser()
_option_table = (
    (('--model_path', '-m'),
     dict(type=str, required=True,
          help='Full path for saving weights during training')),
    (('--encoder_name', '-e'),
     dict(choices=['bert', 'bertentity'], default='bert',
          help=('Encoder model, choose from BERT (use [CLS] representation)'
                ' or BERT-entity (use concatenation of two entity representations)'))),
    (('--restore',),
     dict(action='store_true',
          help='Whether to restore model weights from given model path')),
    (('--train_path', '-t'),
     dict(type=str, required=True,
          help='Full path to file containing training data')),
    (('--valid_path', '-v'),
     dict(type=str, required=True,
          help='Full path to file containing validation data')),
    (('--relation_path', '-r'),
     dict(type=str, required=True,
          help='Full path to json file containing relation to index dict')),
    (('--num_epochs', '-n'),
     dict(type=int, default=10,
          help='Number of training epochs')),
    (('--max_seq_len', '-l'),
     dict(type=int, default=128,
          help='Maximum sequence length of bert model')),
    (('--batch_size', '-b'),
     dict(type=int, default=64,
          help='Batch size for training and testing')),
    (('--metric',),
     dict(default='micro_f1', choices=['micro_f1', 'acc'],
          help='Metric chosen for evaluation')),
    (('--pretrain_path', '-p'),
     dict(type=str,
          help='Path to pretrained bert-base model weights')),
)
for _flags, _settings in _option_table:
    parser.add_argument(*_flags, **_settings)
# Parse the command line; argparse exits with a usage message when a required
# option is missing.
args = parser.parse_args()

# Load the relation -> index dict from the JSON file given by --relation_path.
# The context manager closes the file handle as soon as parsing is done
# instead of leaving an open handle behind; JSON is read as UTF-8.
with open(args.relation_path, encoding='utf-8') as relation_file:
    rel2id = json.load(relation_file)
# Define the sentence encoder: map the --encoder_name choice to its encoder
# class, then build it from the command-line settings.
encoders = {
    'bert': encoder.BERTEncoder,
    'bertentity': encoder.BERTEntityEncoder,
}
_encoder_class = encoders[args.encoder_name.lower()]
# NOTE(review): --pretrain_path has no default, so pretrain_path may be None
# here -- confirm the encoder accepts that.
sentence_encoder = _encoder_class(
    max_length=args.max_seq_len,
    pretrain_path=args.pretrain_path,
    mask_entity=False,
)
# Define the model: a SoftmaxNN built on the sentence encoder, given the number
# of entries in rel2id and the rel2id mapping itself.
_relation_count = len(rel2id)
model = opennre.model.SoftmaxNN(sentence_encoder, _relation_count, rel2id)
# Define the whole training framework. The settings are gathered in one
# mapping and handed to SentenceRE as keyword arguments.
_framework_settings = {
    'train_path': args.train_path,
    'val_path': args.valid_path,
    # The validation file is also passed as the test set.
    'test_path': args.valid_path,
    'model': model,
    'ckpt': args.model_path,
    'batch_size': args.batch_size,
    'max_epoch': args.num_epochs,
    'lr': 2e-5,
    'opt': 'adamw',
}
framework = opennre.framework.SentenceRE(**_framework_settings)
# Restore from old model weights when --restore is given. The checkpoint at
# --model_path is expected to hold the weights under the 'state_dict' key.
if args.restore:
    # map_location='cpu' lets a checkpoint that was written on a GPU machine be
    # deserialized on any host, including one without CUDA.
    checkpoint = torch.load(args.model_path, map_location='cpu')
    framework.load_state_dict(checkpoint['state_dict'])
    logging.info('Restored model weights from %s', args.model_path)

# Train the model, passing the metric chosen with --metric.
framework.train_model(args.metric)