-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtask_config.py
98 lines (96 loc) · 4.69 KB
/
task_config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
# Hyperparameter presets for the "stand" setup, keyed by task name
# ("20news", "agnews", "sst_2").
# Every value is kept as a string, including numbers and booleans.
# NOTE(review): consumers presumably parse these strings themselves - confirm.
# Key order inside each preset mirrors the historical layout (note that
# "sst_2" lists hidden_size before num_layers) in case a caller iterates it.
stand_task_config_dir = {
    "20news": dict(
        epochs="1",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.5",
        num_layers="1",
        embedding_file="glove.6B.300d.txt",
        embedding_dropout="0.0",
        do_remove_stop_words="True",
        do_remove_low_freq_words="5",
        batch_size="32",
        max_seq_len="512",
        hidden_size="300",
        comm_round="100",
        num_filter="192",
        cnn_dropout="0.1",
    ),
    "agnews": dict(
        epochs="1",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.1",
        num_layers="1",
        embedding_file="glove.6B.300d.txt",
        embedding_dropout="0.0",
        do_remove_stop_words="False",
        do_remove_low_freq_words="0",
        batch_size="128",
        max_seq_len="128",
        hidden_size="300",
        comm_round="100",
        num_filter="192",
        cnn_dropout="0.1",
    ),
    "sst_2": dict(
        epochs="1",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.5",
        hidden_size="300",
        num_layers="1",
        embedding_file="glove.840B.300d.txt",
        embedding_dropout="0.3",
        do_remove_stop_words="False",
        do_remove_low_freq_words="0",
        batch_size="400",
        max_seq_len="32",
        comm_round="100",
        num_filter="192",
        cnn_dropout="0.1",
    ),
}
# Hyperparameter presets for the "tune" setup, keyed by task name
# ("20news", "agnews", "sst_2").
# Every value is kept as a string, including numbers and booleans.
# NOTE(review): consumers presumably parse these strings themselves - confirm.
# These presets carry a "ci" entry and define neither "hidden_size" nor
# "num_layers"; key order mirrors the historical layout.
tune_task_config_dir = {
    "20news": dict(
        epochs="10",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.5",
        embedding_file="glove.6B.300d.txt",
        embedding_dropout="0.0",
        do_remove_stop_words="True",
        do_remove_low_freq_words="5",
        batch_size="400",
        max_seq_len="512",
        comm_round="100",
        ci="1",
        num_filter="50",
        cnn_dropout="0.5",
    ),
    "agnews": dict(
        epochs="10",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.1",
        embedding_file="glove.6B.300d.txt",
        embedding_dropout="0.0",
        do_remove_stop_words="False",
        do_remove_low_freq_words="0",
        batch_size="256",
        max_seq_len="128",
        comm_round="60",
        ci="1",
        num_filter="50",
        cnn_dropout="0.1",
    ),
    "sst_2": dict(
        epochs="1",
        lr="5e-3",
        wd="0.0001",
        lstm_dropout="0.5",
        embedding_file="glove.840B.300d.txt",
        embedding_dropout="0.3",
        do_remove_stop_words="False",
        do_remove_low_freq_words="0",
        batch_size="400",
        max_seq_len="32",
        comm_round="150",
        ci="1",
        num_filter="50",
        cnn_dropout="0.5",
    ),
}
# Per-task, per-model presets: tlm_task_config_dir[task][model] -> settings.
# Tasks are "20news", "agnews", "sst_2"; models are "distilbert", "bert",
# "albert". Every value is kept as a string.
# NOTE(review): "tlm" presumably stands for transformer language model - confirm.
#
# The table is generated from a compact spec because most fields repeat:
#   * lr, weight_decay and comm_round are the same for every entry;
#   * epochs and max_seq_len depend only on the task;
#   * only the two batch sizes differ between models.
# Task order, model order within a task, and key order within an entry all
# follow the historical layout.
tlm_task_config_dir = {
    task: {
        model: {
            "epochs": epochs,
            "lr": "5e-5",
            "weight_decay": "0.0",
            "train_batch_size": train_bs,
            "eval_batch_size": eval_bs,
            "max_seq_len": max_len,
            "comm_round": "100",
        }
        for model, train_bs, eval_bs in batch_sizes
    }
    # Rows: (task, epochs, max_seq_len,
    #        ((model, train_batch_size, eval_batch_size), ...))
    for task, epochs, max_len, batch_sizes in (
        (
            "20news", "1", "256",
            (
                ("distilbert", "32", "200"),
                ("bert", "32", "200"),
                ("albert", "64", "64"),
            ),
        ),
        (
            "agnews", "2", "128",
            (
                ("albert", "64", "200"),
                ("bert", "64", "200"),
                ("distilbert", "64", "200"),
            ),
        ),
        (
            "sst_2", "3", "32",
            (
                ("albert", "256", "128"),
                ("bert", "256", "200"),
                ("distilbert", "256", "128"),
            ),
        ),
    )
}