-
Notifications
You must be signed in to change notification settings - Fork 0
/
finetune_best2010lm_bertlike12_s2s_sp_wisesight.json
76 lines (73 loc) · 1.78 KB
/
finetune_best2010lm_bertlike12_s2s_sp_wisesight.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
{
"model": {
"class": "SequenceTransferLearningWrapper",
"config": {
"output_class_num": 4,
"encoder_checkpoint": "_outputs_/benchmark_best2010lm_bertlike12_s2s_sp_trial_3/checkpoint/best_weight.h5",
"train_encoder": true,
"max_input_length": 256,
"drop_out": 0.4,
"cached_data_dir": "_cache_",
"encoder_model": {
"class": "BERTWrapper",
"config": {
"len_limit": 256,
"d_model": 512,
"d_inner_hid": 2048,
"n_head": 8,
"d_k": 512,
"d_v": 512,
"layers": 12,
"dropout": 0.1,
"share_word_emb": true,
"max_input_length": 256,
"max_mask_tokens": 80,
"cached_data_dir": "_cache_"
}
},
"encoder_dict_dataset": {
"class": "BEST2010LMDatasetWrapper",
"config": {
"base_data_dir": "_tmp_"
}
}
}
},
"dataset": {
"class": "WisesightDatasetWrapper",
"config": {
"base_data_dir": "_tmp_"
}
},
"input_transform": {
"class": "BERTSentencePiecePretrainWrapper",
"config": {
"column_id": 0,
"max_dict_size": 15000,
"max_seq_length": 256,
"is_input": true,
"is_pretrain": false,
"clf_id": 2
}
},
"output_transform": {
"class": "SingleClassTransformWrapper",
"config": {
"column_id": 1
}
},
"callbacks": [
],
"execution": {
"config": {
"optimizer": "bert",
"optimizer_params": [0.0005, 0.9, 0.997, 1e-9, 160, 1.0, 0.01],
"batch_size": 32,
"epochs": 30,
"watch_metric": "val_acc",
"output_dir": "_outputs_/finetune_best2010lm_bertlike12_s2s_sp_wisesight",
"save_weight_history": false,
"resume_if_possible": true
}
}
}