-
Notifications
You must be signed in to change notification settings - Fork 0
/
results.yaml
551 lines (522 loc) · 10.3 KB
/
results.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
- size: small
type: text
task: claim
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.365
train_factual_f1: 0.455
train_misinfo_f1: 0.946
val_loss: 0.433
val_factual_f1: 0.150
val_misinfo_f1: 0.925
test_loss: 0.396
test_factual_f1: 0.303
test_misinfo_f1: 0.948
- size: small
type: text
task: claim
frozen: true
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.459
train_factual_f1: 0.374
train_misinfo_f1: 0.917
val_loss: 0.513
val_factual_f1: 0.157
val_misinfo_f1: 0.903
test_loss: 0.511
test_factual_f1: 0.216
test_misinfo_f1: 0.934
- size: small
type: text
task: claim
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.699
train_factual_f1: 0.691
train_misinfo_f1: 0.962
val_loss: 3.880
val_factual_f1: 0.152
val_misinfo_f1: 0.852
test_loss: 3.192
test_factual_f1: 0.325
test_misinfo_f1: 0.852
- size: medium
type: text
task: claim
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.183
train_factual_f1: 0.608
train_misinfo_f1: 0.965
val_loss: 0.327
val_factual_f1: 0.290
val_misinfo_f1: 0.964
test_loss: 0.515
test_factual_f1: 0.195
test_misinfo_f1: 0.922
- size: medium
type: text
task: claim
frozen: true
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.425
train_factual_f1: 0.333
train_misinfo_f1: 0.942
val_loss: 0.342
val_factual_f1: 0.237
val_misinfo_f1: 0.952
test_loss: 0.507
test_factual_f1: 0.173
test_misinfo_f1: 0.909
- size: medium
type: text
task: claim
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.011
train_factual_f1: 0.987
train_misinfo_f1: 0.999
val_loss: 2.857
val_factual_f1: 0.268
val_misinfo_f1: 0.931
test_loss: 1.949
test_factual_f1: 0.315
test_misinfo_f1: 0.941
- size: large
type: text
task: claim
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.183
train_factual_f1: 0.529
train_misinfo_f1: 0.968
val_loss: 0.220
val_factual_f1: 0.299
val_misinfo_f1: 0.974
test_loss: 0.317
test_factual_f1: 0.217
test_misinfo_f1: 0.941
- size: large
type: text
task: claim
frozen: true
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.400
train_factual_f1: 0.300
train_misinfo_f1: 0.950
val_loss: 0.309
val_factual_f1: 0.262
val_misinfo_f1: 0.966
test_loss: 0.378
test_factual_f1: 0.160
test_misinfo_f1: 0.940
- size: large
type: text
task: claim
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.249
train_factual_f1: 0.803
train_misinfo_f1: 0.987
val_loss: 1.225
val_factual_f1: 0.353
val_misinfo_f1: 0.946
test_loss: 1.502
test_factual_f1: 0.300
test_misinfo_f1: 0.930
- size: small
type: text
task: tweet
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.030
train_factual_f1: 0.984
train_misinfo_f1: 0.999
val_loss: 1.281
val_factual_f1: 0.040
val_misinfo_f1: 0.927
test_loss: 1.227
test_factual_f1: 0.152
test_misinfo_f1: 0.938
- size: small
type: text
task: tweet
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.027
train_factual_f1: 0.983
train_misinfo_f1: 0.999
val_loss: 1.468
val_factual_f1: 0.476
val_misinfo_f1: 0.965
test_loss: 1.000
test_factual_f1: 0.567
test_misinfo_f1: 0.970
- size: medium
type: text
task: tweet
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.006
train_factual_f1: 0.996
train_misinfo_f1: 1.000
val_loss: 2.146
val_factual_f1: 0.164
val_misinfo_f1: 0.959
test_loss: 3.040
test_factual_f1: 0.207
test_misinfo_f1: 0.942
- size: medium
type: text
task: tweet
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.021
train_factual_f1: 0.979
train_misinfo_f1: 0.999
val_loss: 1.627
val_factual_f1: 0.671
val_misinfo_f1: 0.981
test_loss: 0.895
test_factual_f1: 0.650
test_misinfo_f1: 0.985
- size: large
type: text
task: tweet
frozen: false
split: cluster
model_id: sentence-transformers/LaBSE
train_loss: 0.825
train_factual_f1: 0.142
train_misinfo_f1: 0.975
val_loss: 0.391
val_factual_f1: 0.071
val_misinfo_f1: 0.989
test_loss: 0.415
test_factual_f1: 0.078
test_misinfo_f1: 0.978
- size: large
type: text
task: tweet
frozen: false
split: random
model_id: sentence-transformers/LaBSE
train_loss: 0.038
train_factual_f1: 0.914
train_misinfo_f1: 0.996
val_loss: 1.392
val_factual_f1: 0.516
val_misinfo_f1: 0.980
test_loss: 0.909
test_factual_f1: 0.558
test_misinfo_f1: 0.982
- size: small
type: image
dropout: 0.2
frozen: false
split: cluster
model_id: google/vit-base-patch16-224-in21k
train_loss: 0.081
train_factual_f1: 0.889
train_misinfo_f1: 0.986
val_loss: 1.775
val_factual_f1: 0.059
val_misinfo_f1: 0.888
test_loss: 3.097
test_factual_f1: 0.194
test_misinfo_f1: 0.870
- size: medium
type: image
dropout: 0.2
frozen: false
split: cluster
model_id: google/vit-base-patch16-224-in21k
train_loss: 0.013
train_factual_f1: 0.942
train_misinfo_f1: 0.995
val_loss: 1.158
val_factual_f1: 0.047
val_misinfo_f1: 0.953
test_loss: 2.669
test_factual_f1: 0.105
test_misinfo_f1: 0.935
- size: large
type: image
dropout: 0.2
frozen: false
split: cluster
model_id: google/vit-base-patch16-224-in21k
train_loss: 0.032
train_factual_f1: 0.842
train_misinfo_f1: 0.989
val_loss: 0.623
val_factual_f1: 0.000
val_misinfo_f1: 0.987
test_loss: 2.338
test_factual_f1: 0.035
test_misinfo_f1: 0.939
- size: small
type: graph
task: claim
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.414
train_factual_f1: 0.563
val_loss: 2.898
val_factual_f1: 0.006
val_misinfo_f1: 0.857
test_loss: 3.405
test_factual_f1: 0.267
test_misinfo_f1: 0.892
- size: medium
type: graph
task: claim
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.389
train_factual_f1: 0.529
val_loss: 1.50
val_factual_f1: 0.155
val_misinfo_f1: 0.916
test_loss: 2.243
test_factual_f1: 0.250
test_misinfo_f1: 0.904
- size: large
type: graph
task: claim
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.232
train_factual_f1: 0.626
val_loss: 2.049
val_factual_f1: 0.285
val_misinfo_f1: 0.952
test_loss: 2.003
test_factual_f1: 0.277
test_misinfo_f1: 0.919
- size: small
type: graph
task: tweet
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.168
train_factual_f1: 0.805
val_loss: 1.639
val_factual_f1: 0.038
val_misinfo_f1: 0.902
test_loss: 4.786
test_factual_f1: 0.189
test_misinfo_f1: 0.932
- size: medium
type: graph
task: tweet
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.139
train_factual_f1: 0.809
val_loss: 2.424
val_factual_f1: 0.270
val_misinfo_f1: 0.932
test_loss: 8.403
test_factual_f1: 0.173
test_misinfo_f1: 0.909
- size: large
type: graph
task: tweet
split: cluster
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.120
train_factual_f1: 0.814
val_loss: 2.17
val_factual_f1: 0.260
val_misinfo_f1: 0.971
test_loss: 3.369
test_factual_f1: 0.269
test_misinfo_f1: 0.960
- size: small
type: graph
task: claim
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.424
train_factual_f1: 0.565
val_loss: 3.514
val_factual_f1: 0.423
val_misinfo_f1: 0.921
test_loss: 2.642
test_factual_f1: 0.083
test_misinfo_f1: 0.887
- size: medium
type: graph
task: claim
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.311
train_factual_f1: 0.558
val_loss: 2.277
val_factual_f1: 0.415
val_misinfo_f1: 0.938
test_loss: 2.672
test_factual_f1: 0.294
test_misinfo_f1: 0.934
- size: large
type: graph
task: claim
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.321
train_factual_f1: 0.510
val_loss: 2.400
val_factual_f1: 0.409
val_misinfo_f1: 0.938
test_loss: 1.736
test_factual_f1: 0.311
test_misinfo_f1: 0.940
- size: small
type: graph
task: tweet
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.106
train_factual_f1: 0.854
val_loss: 4.404
val_factual_f1: 0.585
val_misinfo_f1: 0.957
test_loss: 4.584
test_factual_f1: 0.537
test_misinfo_f1: 0.961
- size: medium
type: graph
task: tweet
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.176
train_factual_f1: 0.746
val_loss: 1.717
val_factual_f1: 0.653
val_misinfo_f1: 0.955
test_loss: 1.178
test_factual_f1: 0.807
test_misinfo_f1: 0.983
- size: large
type: graph
task: tweet
split: random
nhops: 2
hetero_layer_norm: true
hidden_dim: 1024
batch_size: 1024
input_dropout: 0.2
dropout: 0.2
lr: 3e-4
epochs: 300
pos_weight: 20
train_loss: 0.116
train_factual_f1: 0.811
val_loss: 1.784
val_factual_f1: 0.634
val_misinfo_f1: 0.977
test_loss: 1.995
test_factual_f1: 0.620
test_misinfo_f1: 0.976