NhatCuong22 commited on
Commit
4c6d5de
·
verified ·
1 Parent(s): 80939db

Upload benchmark/peerread_base_metrics.json

Browse files
benchmark/peerread_base_metrics.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "label": "gemma4-base-v3",
3
+ "input": "/root/benchmark/results/peerread_base_v3_full.jsonl",
4
+ "n_papers": 95,
5
+ "venues": {
6
+ "acl_2017": 14,
7
+ "conll_2016": 3,
8
+ "iclr_2017": 78
9
+ },
10
+ "gen_time_s": {
11
+ "mean": 78.45,
12
+ "median": 74.94,
13
+ "total_min": 124.2
14
+ },
15
+ "review_words": {
16
+ "mean": 634.0,
17
+ "median": 631
18
+ },
19
+ "T2_decision_overall": {
20
+ "n": 95,
21
+ "accept_rate_true": 0.842,
22
+ "accept_rate_pred": 0.832,
23
+ "accuracy": 0.7368,
24
+ "precision": 0.8481,
25
+ "recall": 0.8375,
26
+ "f1": 0.8428
27
+ },
28
+ "T2_decision_per_venue": {
29
+ "acl_2017": {
30
+ "n": 14,
31
+ "accept_rate_true": 0.643,
32
+ "accept_rate_pred": 0.929,
33
+ "accuracy": 0.7143,
34
+ "precision": 0.6923,
35
+ "recall": 1.0,
36
+ "f1": 0.8182
37
+ },
38
+ "conll_2016": {
39
+ "n": 3,
40
+ "accept_rate_true": 0.333,
41
+ "accept_rate_pred": 1.0,
42
+ "accuracy": 0.3333,
43
+ "precision": 0.3333,
44
+ "recall": 1.0,
45
+ "f1": 0.5
46
+ },
47
+ "iclr_2017": {
48
+ "n": 78,
49
+ "accept_rate_true": 0.897,
50
+ "accept_rate_pred": 0.808,
51
+ "accuracy": 0.7564,
52
+ "precision": 0.9048,
53
+ "recall": 0.8143,
54
+ "f1": 0.8571
55
+ }
56
+ },
57
+ "T1_rouge_overall": {
58
+ "rouge1": {
59
+ "n": 95,
60
+ "mean_pct": 28.42
61
+ },
62
+ "rouge2": {
63
+ "n": 95,
64
+ "mean_pct": 6.6
65
+ },
66
+ "rougeL": {
67
+ "n": 95,
68
+ "mean_pct": 12.45
69
+ }
70
+ },
71
+ "T1_rouge_per_venue": {
72
+ "acl_2017": {
73
+ "n": 14,
74
+ "rougeL_mean_pct": 14.46
75
+ },
76
+ "conll_2016": {
77
+ "n": 3,
78
+ "rougeL_mean_pct": 15.75
79
+ },
80
+ "iclr_2017": {
81
+ "n": 78,
82
+ "rougeL_mean_pct": 11.96
83
+ }
84
+ }
85
+ }