Yash1005 committed on
Commit
0bb2130
·
verified ·
1 Parent(s): 7bf2e1e

add eval metrics json

Browse files
Files changed (1) hide show
  1. eval_metrics.json +16 -16
eval_metrics.json CHANGED
@@ -2,26 +2,26 @@
2
  "n": 500,
3
  "threshold": 0.5,
4
  "max_seq_length": 3072,
5
- "is_valid_accuracy": 0.89,
6
- "category_set_accuracy": 0.054,
7
- "micro_f1": 0.3512092534174553,
8
- "macro_f1": 0.35552414101596475,
9
  "per_category_f1": {
10
- "DirectInjection": 0.5232558139534884,
11
- "Jailbreak": 0.39705882352941174,
12
- "Adversarial": 0.4,
13
- "Extraction": 0.2569444444444444,
14
- "Encoding": 0.373134328358209,
15
- "Manipulation": 0.2717391304347826,
16
- "Smuggling": 0.49122807017543857,
17
- "Indirect": 0.3228346456692913,
18
- "MultiTurn": 0.16352201257861634
19
  },
20
  "latency_ms_per_example": {
21
- "mean": 1.823335886001587,
22
- "p95": 1.9494213163852692,
23
  "device": "cuda:0"
24
  },
25
  "base_model": "jhu-clsp/mmBERT-base",
26
- "epochs": 3
27
  }
 
2
  "n": 500,
3
  "threshold": 0.5,
4
  "max_seq_length": 3072,
5
+ "is_valid_accuracy": 0.864,
6
+ "category_set_accuracy": 0.626,
7
+ "micro_f1": 0.7423664122137404,
8
+ "macro_f1": 0.7334963397298655,
9
  "per_category_f1": {
10
+ "DirectInjection": 0.9076923076923077,
11
+ "Jailbreak": 0.5773195876288659,
12
+ "Adversarial": 0.7941176470588235,
13
+ "Extraction": 0.7478260869565218,
14
+ "Encoding": 0.7123287671232876,
15
+ "Manipulation": 0.693069306930693,
16
+ "Smuggling": 0.8429752066115702,
17
+ "Indirect": 0.6730769230769231,
18
+ "MultiTurn": 0.6530612244897959
19
  },
20
  "latency_ms_per_example": {
21
+ "mean": 1.7679505981504917,
22
+ "p95": 1.7809227108955383,
23
  "device": "cuda:0"
24
  },
25
  "base_model": "jhu-clsp/mmBERT-base",
26
+ "epochs": 10
27
  }