File size: 2,957 Bytes
f170b94
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
<!--
  Grouped bar chart: two categories (Keyword Refusal, Classifier ASR), two series each
  (Previous SABER in blue, Final NSC-ACE-SABER in teal).
  Vertical scale: 0% is y=332 and 8% is y=112, i.e. 27.5px per percentage point,
  so a bar for value v has height round(v * 27.5) and y = 332 - height.
  Shared text styling is inherited from the root and from <g> wrappers.
-->
<svg xmlns="http://www.w3.org/2000/svg"
     width="920"
     height="430"
     viewBox="0 0 920 430"
     role="img"
     aria-labelledby="title desc"
     font-family="Arial, sans-serif">
  <title id="title">Final SABER HarmBench calibration</title>
  <desc id="desc">Bar chart comparing previous SABER and final NSC-ACE-SABER on HarmBench keyword refusal and classifier ASR.</desc>

  <!-- Opaque white background covering the full 920x430 canvas. -->
  <rect width="920" height="430" fill="#ffffff"/>

  <!-- Heading and subtitle. -->
  <text x="40" y="42" font-size="24" font-weight="700" fill="#111827">Final HarmBench Calibration</text>
  <text x="40" y="72" font-size="14" fill="#4b5563">HarmBench text subset, n=320. Lower keyword refusal means less boilerplate refusal wording; ASR remains gated.</text>

  <!-- Plot frame: x axis along y=332 (the 0% baseline) and y axis along x=88. -->
  <g stroke="#d1d5db" stroke-width="1">
    <line x1="88" y1="332" x2="850" y2="332"/>
    <line x1="88" y1="112" x2="88" y2="332"/>
  </g>

  <!-- Lighter horizontal gridlines at 2%, 4% and 6% (55px apart). -->
  <g stroke="#eef2f7" stroke-width="1">
    <line x1="88" y1="277" x2="850" y2="277"/>
    <line x1="88" y1="222" x2="850" y2="222"/>
    <line x1="88" y1="167" x2="850" y2="167"/>
  </g>

  <!--
    Y-axis tick labels. Right-aligned on a shared x so every label ends at the same
    column regardless of glyph widths; each baseline sits 5px below its gridline.
  -->
  <g font-size="12" fill="#6b7280" text-anchor="end">
    <text x="64" y="337">0%</text>
    <text x="64" y="282">2%</text>
    <text x="64" y="227">4%</text>
    <text x="64" y="172">6%</text>
    <text x="64" y="117">8%</text>
  </g>

  <!-- Bars, 86px wide, all resting on the y=332 baseline. -->
  <g>
    <!-- Keyword Refusal: 6.56% (previous) and 4.06% (final). -->
    <rect x="180" y="152" width="86" height="180" rx="4" fill="#2563eb"/>
    <rect x="286" y="220" width="86" height="112" rx="4" fill="#14b8a6"/>
    <!-- Classifier ASR: 0.63% (previous) and 0.00% (final). -->
    <rect x="550" y="315" width="86" height="17" rx="4" fill="#2563eb"/>
    <!-- Zero height: nothing is painted for this bar; the rect is kept so each series has an entry. -->
    <rect x="656" y="332" width="86" height="0" rx="4" fill="#14b8a6"/>
  </g>

  <!-- Value labels, centred on each bar (x = bar x + 43). -->
  <g font-size="14" font-weight="700" fill="#111827" text-anchor="middle">
    <text x="223" y="142">6.56%</text>
    <text x="329" y="210">4.06%</text>
    <text x="593" y="305">0.63%</text>
    <text x="699" y="318">0.00%</text>
  </g>

  <!-- Category labels, centred under each pair of bars (midpoint of the pair's outer edges). -->
  <g font-size="14" font-weight="700" fill="#111827" text-anchor="middle">
    <text x="276" y="365">Keyword Refusal</text>
    <text x="646" y="365">Classifier ASR</text>
  </g>

  <!-- Legend: colour swatch followed by the series name. -->
  <g font-size="13" fill="#374151">
    <rect x="285" y="392" width="14" height="14" rx="2" fill="#2563eb"/>
    <text x="307" y="404">Previous SABER</text>
    <rect x="464" y="392" width="14" height="14" rx="2" fill="#14b8a6"/>
    <text x="486" y="404">Final NSC-ACE-SABER</text>
  </g>
</svg>