-
Notifications
You must be signed in to change notification settings - Fork 0
/
ablation_record2.txt
108 lines (108 loc) · 17.3 KB
/
ablation_record2.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
TREC_0.93000modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers8_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_0.852
TREC_0.88200modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_15.918
SST_0.49890modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0006_batch_size32_val_split0.1_layers4_n_head8_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_29.959
MR_0.50702modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0006_batch_size32_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_65.094
ROTTENTOMATOES_0.50389modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.001_batch_size32_val_split0.1_layers8_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_269.062
ROTTENTOMATOES_0.50389modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0006_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_517.981
ROTTENTOMATOES_0.49610modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0006_batch_size96_val_split0.1_layers4_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_5.434
ROTTENTOMATOES_0.50389modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.01_batch_size96_val_split0.1_layers4_n_head6_d_inner_hid512_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_171.211
ROTTENTOMATOES_0.50389modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0006_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_16.098
ROTTENTOMATOES_0.79240modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0006_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_140.201
SUBJ_0.92199modelcnn_hidden_unit_num100_dropout_rate0.4_lr0.0001_batch_size64_val_split0.1_layers4_n_head6_d_inner_hid128_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_1.893
SST_0.80186modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_8.692
SUBJ_0.93199modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_21.149
TREC_0.92199modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size32_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_2.284
MR_0.77507modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers6_n_head8_d_inner_hid256_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_3.947
ROTTENTOMATOES_0.63969modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size64_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_131.097
MR_0.50702modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional', 'both_direct', 'major_rels', 'separator', 'rare_word']_12.78
MR_0.76382modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0001_batch_size64_val_split0.1_layers8_n_head6_d_inner_hid512_roles['positional']_0.963
SUBJ_0.92500modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_0.859
SUBJ_0.93699modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.0005_batch_size32_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional']_1.746
SUBJ_0.51599modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.0005_batch_size32_val_split0.1_layers6_n_head8_d_inner_hid128_roles['positional']_1.574
SUBJ_0.93300modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size96_val_split0.1_layers8_n_head6_d_inner_hid256_roles['positional']_0.715
SUBJ_0.93599modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0005_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid128_roles['positional']_1.762
SUBJ_0.94099modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_14.028
SUBJ_0.91699modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0001_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid512_roles['positional']_13.222
SUBJ_0.48399modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size32_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional']_1.614
MR_0.73851modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size96_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_10.904
MR_0.77600modelcnn_hidden_unit_num100_dropout_rate0.4_lr0.0005_batch_size64_val_split0.1_layers8_n_head6_d_inner_hid256_roles['positional']_1.02
MR_0.72727modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0005_batch_size96_val_split0.1_layers4_n_head8_d_inner_hid256_roles['positional']_10.745
MR_0.73383modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional']_9.806
SUBJ_0.93000modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional']_18.296
SUBJ_0.94199modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers4_n_head6_d_inner_hid128_roles['positional']_12.532
SUBJ_0.93699modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.001_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid128_roles['positional']_16.202
MR_0.64292modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional']_20.029
IMDB_0.84500modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.0005_batch_size32_val_split0.1_layers4_n_head8_d_inner_hid256_roles['positional']_605.852
IMDB_0.64789modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_203.859
IMDB_0.50389modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid256_roles['positional']_7.663
IMDB_0.50389modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size32_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional']_667.839
IMDB_0.50389modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional']_7.059
IMDB_0.80119modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_220.44
IMDB_0.84409modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.0005_batch_size64_val_split0.1_layers8_n_head8_d_inner_hid128_roles['positional']_305.457
IMDB_0.625modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.0001_batch_size64_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional']_330.241
IMDB_0.50389modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.0005_batch_size96_val_split0.1_layers4_n_head8_d_inner_hid512_roles['positional']_5.81
IMDB_0.85240modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_307.071
SST_0.81394modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid256_roles['positional']_1.263
SST_0.49890modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.001_batch_size32_val_split0.1_layers6_n_head8_d_inner_hid128_roles['positional']_1.284
SST_0.78759modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size32_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional']_21.266
SST_0.80515modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid256_roles['positional']_0.542
SST_0.79747modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid256_roles['positional']_9.544
SST_0.80186modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0001_batch_size96_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional']_0.517
SST_0.80076modelcnn_hidden_unit_num100_dropout_rate0.2_lr0.0001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional']_0.505
SST_0.51811modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_19.708
SST_0.81503modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers8_n_head6_d_inner_hid128_roles['positional']_1.29
SST_0.51701modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers2_n_head8_d_inner_hid512_roles['positional']_6.583
SST_0.79967modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size32_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional']_19.007
ROTTENTOMATOES_0.81160modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid256_roles['positional']_4.468
ROTTENTOMATOES_0.49610modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.001_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_224.474
ROTTENTOMATOES_0.62769modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size96_val_split0.1_layers2_n_head8_d_inner_hid512_roles['positional']_73.174
ROTTENTOMATOES_0.72920modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional']_74.294
ROTTENTOMATOES_0.81629modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid512_roles['positional']_4.499
ROTTENTOMATOES_0.49610modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.001_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional']_2.894
ROTTENTOMATOES_0.79269modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.0005_batch_size64_val_split0.1_layers4_n_head8_d_inner_hid128_roles['positional']_109.061
ROTTENTOMATOES_0.80440modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_112.346
ROTTENTOMATOES_0.80949modelcnn_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size96_val_split0.1_layers2_n_head8_d_inner_hid128_roles['positional']_3.029
ROTTENTOMATOES_0.78850modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0001_batch_size32_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_198.508
DBPEDIA_0.97619modelbilstm_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size64_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional']_774.256
DBPEDIA_0.97132modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional']_548.999
DBPEDIA_0.97698modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0005_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid256_roles['positional']_95.732
TREC_0.89399modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid256_roles['positional']_26.795
DBPEDIA_0.97585modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size64_val_split0.1_layers4_n_head8_d_inner_hid128_roles['positional']_829.42
TREC_0.93199modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_0.78
TREC_0.89600modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional']_13.003
TREC_0.88400modelbilstm_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size64_val_split0.1_layers8_n_head6_d_inner_hid512_roles['positional']_12.599
TREC_0.91600modelcnn_hidden_unit_num100_dropout_rate0.4_lr0.0005_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_0.487
TREC_0.88999modelbilstm_hidden_unit_num100_dropout_rate0.4_lr0.001_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid128_roles['positional']_22.131
TREC_0.93000modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_0.72
TREC_0.86000modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.0001_batch_size64_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_12.248
TREC_0.89800modelcnn_hidden_unit_num200_dropout_rate0.4_lr0.0001_batch_size64_val_split0.1_layers8_n_head6_d_inner_hid512_roles['positional']_0.758
TREC_0.88599modelcnn_hidden_unit_num100_dropout_rate0.4_lr0.0001_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid128_roles['positional']_1.258
DBPEDIA_0.97649modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.001_batch_size64_val_split0.1_layers2_n_head6_d_inner_hid256_roles['positional']_827.697
TREC_0.91799modelcnn_hidden_unit_num300_dropout_rate0.3_lr0.0001_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid128_roles['positional']_30.714
TREC_0.92599modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size96_val_split0.1_layers6_n_head8_d_inner_hid128_roles['positional']_21.785
TREC_0.88400modelbilstm_hidden_unit_num300_dropout_rate0.3_lr0.001_batch_size96_val_split0.1_layers4_n_head8_d_inner_hid256_roles['positional']_183.347
DBPEDIA_0.97611modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size96_val_split0.1_layers4_n_head6_d_inner_hid256_roles['positional']_503.528
TREC_0.89399modelbilstm_hidden_unit_num300_dropout_rate0.4_lr0.0005_batch_size32_val_split0.1_layers8_n_head6_d_inner_hid512_roles['positional']_226.305
TREC_0.91600modelcnn_hidden_unit_num100_dropout_rate0.2_lr0.001_batch_size96_val_split0.1_layers8_n_head6_d_inner_hid512_roles['positional']_11.703
DBPEDIA_0.97477modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_752.386
TREC_0.86400modelbilstm_hidden_unit_num200_dropout_rate0.4_lr0.0001_batch_size32_val_split0.1_layers6_n_head8_d_inner_hid256_roles['positional']_134.699
TREC_0.91399modelcnn_hidden_unit_num300_dropout_rate0.4_lr0.0001_batch_size32_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_31.338
TREC_0.91000modelcnn_hidden_unit_num200_dropout_rate0.3_lr0.0001_batch_size32_val_split0.1_layers2_n_head6_d_inner_hid512_roles['positional']_22.121
TREC_0.88400modelbilstm_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers6_n_head6_d_inner_hid128_roles['positional']_135.144
TREC_0.86000modelbilstm_hidden_unit_num300_dropout_rate0.2_lr0.0001_batch_size96_val_split0.1_layers6_n_head8_d_inner_hid512_roles['positional']_186.525
DBPEDIA_0.97617modelbilstm_hidden_unit_num100_dropout_rate0.3_lr0.0001_batch_size32_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional']_1653.846
IMDB_0.50389modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.001_batch_size96_val_split0.1_layers6_n_head6_d_inner_hid256_roles['positional']_semEmbed732.487
IMDB_0.50389modelcnn_hidden_unit_num300_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers2_n_head8_d_inner_hid512_roles['positional']_semEmbed992.59
IMDB_0.87510modelcnn_hidden_unit_num200_dropout_rate0.2_lr0.0001_batch_size32_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional']_semEmbed778.772
IMDB_0.50389modelcnn_hidden_unit_num300_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid128_roles['positional']_semEmbed1005.375
IMDB_0.49610modelcnn_hidden_unit_num300_dropout_rate0.4_lr0.0005_batch_size32_val_split0.1_layers8_n_head8_d_inner_hid256_roles['positional']_semEmbed1095.354
IMDB_0.49610modelcnn_hidden_unit_num300_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head8_d_inner_hid256_roles['positional']_semEmbed1083.765
IMDB_0.49610modelcnn_hidden_unit_num100_dropout_rate0.2_lr0.001_batch_size64_val_split0.1_layers8_n_head8_d_inner_hid512_roles['positional']_semEmbed377.499
YELP_0.92199modeltransformer_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size32_val_split0.1_layers2_n_head8_d_inner_hid256_roles['positional', 'both_direct', 'major_rels']_310.294
YELP_0.92228modeltransformer_hidden_unit_num200_dropout_rate0.2_lr0.0005_batch_size64_val_split0.1_layers2_n_head8_d_inner_hid128_roles['positional', 'both_direct', 'major_rels']_220.918
YELP_0.92326modeltransformer_hidden_unit_num300_dropout_rate0.3_lr0.0001_batch_size32_val_split0.1_layers4_n_head6_d_inner_hid128_roles['positional', 'both_direct', 'major_rels']_461.179
YELP_0.92352modeltransformer_hidden_unit_num200_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers2_n_head6_d_inner_hid256_roles['positional', 'both_direct', 'major_rels']_201.635
YELP_0.91752modeltransformer_hidden_unit_num300_dropout_rate0.2_lr0.001_batch_size96_val_split0.1_layers8_n_head8_d_inner_hid128_roles['positional', 'both_direct', 'major_rels']_692.749
YELP_0.92221modeltransformer_hidden_unit_num100_dropout_rate0.2_lr0.0005_batch_size96_val_split0.1_layers2_n_head6_d_inner_hid128_roles['positional', 'both_direct', 'major_rels']_170.564
YELP_0.90731modeltransformer_hidden_unit_num100_dropout_rate0.3_lr0.0005_batch_size64_val_split0.1_layers6_n_head6_d_inner_hid512_roles['positional', 'both_direct', 'major_rels']_540.812
YELP_0.91186modeltransformer_hidden_unit_num300_dropout_rate0.2_lr0.0005_batch_size32_val_split0.1_layers4_n_head8_d_inner_hid128_roles['positional', 'both_direct', 'major_rels']_510.454