-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathmain.py
More file actions
82 lines (59 loc) · 3.05 KB
/
main.py
File metadata and controls
82 lines (59 loc) · 3.05 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
import argparse
import json
import os
import random
import csv
from typing import List
import numpy as np
import torch
from module.trainer import LearningEnv
def set_random_seed(seed: int):
random_seed = seed
torch.manual_seed(random_seed)
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False
np.random.seed(random_seed)
random.seed(random_seed)
torch.cuda.manual_seed(random_seed)
torch.cuda.manual_seed_all(random_seed)
def parse_args() -> argparse.Namespace:
parser = argparse.ArgumentParser(description='This code is for ECPE task.')
# Training Environment
parser.add_argument('--gpus', default=[0])
parser.add_argument('--num_process', default=int(os.cpu_count() * 0.8), type=int)
parser.add_argument('--num_worker', default=6, type=int)
parser.add_argument('--port', default=1234, type=int)
parser.add_argument('--model_name', default='PRG_MoE')
parser.add_argument('--pretrained_model', default=None)
parser.add_argument('--test', default=False)
parser.add_argument('--split_directory', default=None)
parser.add_argument('--train_data', default="data/data_fold/data_0/dailydialog_train.json")
parser.add_argument('--valid_data', default="data/data_fold/data_0/dailydialog_valid.json")
parser.add_argument('--test_data', default="data/data_fold/data_0/dailydialog_test.json")
parser.add_argument('--log_directory', default='logs', type=str)
parser.add_argument('--data_label', help='the label that attaches to saved model', default='dailydialog_fold_0')
parser.add_argument('--dropout', default=0.5, type=float)
parser.add_argument('--n_speaker', help='the number of speakers', default=2, type=int)
parser.add_argument('--n_emotion', help='the number of emotions', default=7, type=int)
parser.add_argument('--n_cause', help='the number of causes', default=2, type=int)
parser.add_argument('--n_expert', help='the number of causes', default=4, type=int)
parser.add_argument('--guiding_lambda', help='the mixing ratio', default=0.6, type=float)
parser.add_argument('--max_seq_len', help='the max length of each tokenized utterance', default=75, type=int)
parser.add_argument('--contain_context', help='While tokenizing, previous utterances are contained or not', default=False)
parser.add_argument('--training_iter', default=40, type=int)
parser.add_argument('--batch_size', default=5, type=int)
parser.add_argument('--learning_rate', default=5e-5, type=float)
parser.add_argument('--patience', help='patience for Early Stopping', default=None, type=int)
return parser.parse_args()
def test_preconditions(args: argparse.Namespace):
if args.test:
assert args.pretrained_model is not None, "For test, you should load pretrained model."
def main():
args = parse_args()
test_preconditions(args)
set_random_seed(77)
os.environ["CUDA_VISIBLE_DEVICES"] = ",".join([str(_) for _ in args.gpus])
trainer = LearningEnv(**vars(args))
trainer.run(**vars(args))
if __name__ == "__main__":
main()