Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion garak/configs/bag.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@ run:
generations: 3

plugins:
probe_spec: continuation,dan.DanInTheWild,dan.Ablation_Dan_11_0,encoding.InjectAscii85,encoding.InjectBase16,encoding.InjectBase2048,encoding.InjectBase32,encoding.InjectBase64,encoding.InjectBraille,encoding.InjectEcoji,encoding.InjectHex,encoding.InjectMorse,encoding.InjectNato,encoding.InjectROT13,encoding.InjectUU,exploitation.JinjaTemplatePythonInjection,exploitation.SQLInjectionEcho,exploitation.SQLInjectionSystem,goodside,grandma,av_spam_scanning,leakreplay,lmrc,malwaregen,misleading,packagehallucination,realtoxicityprompts,divergence,snowball,suffix,tap,xss
probe_spec: ansiescape,atkgen.Tox,av_spam_scanning,continuation,dan.Ablation_Dan_11_0,dan.AutoDANCached,dan.DanInTheWild,divergence,encoding.InjectAscii85,encoding.InjectBase16,encoding.InjectBase2048,encoding.InjectBase32,encoding.InjectBase64,encoding.InjectBraille,encoding.InjectEcoji,encoding.InjectHex,encoding.InjectMorse,encoding.InjectNato,encoding.InjectROT13,encoding.InjectUU,encoding.InjectZalgo,exploitation.JinjaTemplatePythonInjection,exploitation.SQLInjectionEcho,exploitation.SQLInjectionSystem,goodside,grandma,latentinjection,leakreplay,lmrc,malwaregen,misleading,packagehallucination,phrasing,realtoxicityprompts,snowball,suffix,tap,topic.WordnetControversial,xss
extended_detectors: false
probes:
encoding:
Expand Down
2 changes: 1 addition & 1 deletion garak/data/calibration/bag.md
Original file line number Diff line number Diff line change
Expand Up @@ -70,7 +70,7 @@ run:
generations: 3

plugins:
probe_spec: continuation,dan.DanInTheWild,dan.Ablation_Dan_11_0,encoding.InjectAscii85,encoding.InjectBase16,encoding.InjectBase2048,encoding.InjectBase32,encoding.InjectBase64,encoding.InjectBraille,encoding.InjectEcoji,encoding.InjectHex,encoding.InjectMorse,encoding.InjectNato,encoding.InjectROT13,encoding.InjectUU,exploitation.JinjaTemplatePythonInjection,exploitation.SQLInjectionEcho,exploitation.SQLInjectionSystem,goodside,grandma,av_spam_scanning,leakreplay,lmrc,malwaregen,misleading,packagehallucination,realtoxicityprompts,divergence,snowball,suffix,tap,xss
probe_spec: ansiescape,atkgen.Tox,av_spam_scanning,continuation,dan.Ablation_Dan_11_0,dan.AutoDANCached,dan.DanInTheWild,divergence,encoding.InjectAscii85,encoding.InjectBase16,encoding.InjectBase2048,encoding.InjectBase32,encoding.InjectBase64,encoding.InjectBraille,encoding.InjectEcoji,encoding.InjectHex,encoding.InjectMorse,encoding.InjectNato,encoding.InjectROT13,encoding.InjectUU,encoding.InjectZalgo,exploitation.JinjaTemplatePythonInjection,exploitation.SQLInjectionEcho,exploitation.SQLInjectionSystem,goodside,grandma,latentinjection,leakreplay,lmrc,malwaregen,misleading,packagehallucination,phrasing,realtoxicityprompts,snowball,suffix,tap,topic.WordnetControversial,xss
extended_detectors: false
probes:
encoding:
Expand Down
122 changes: 106 additions & 16 deletions garak/data/calibration/calibration-2025-05.json
Original file line number Diff line number Diff line change
@@ -1,4 +1,19 @@
{
"ansiescape.AnsiEscaped/ansiescape.Escaped": {
"mu": 0.3606138107416879,
"sigma": 0.20339345651454177,
"sw_p": 0.043000268760497
},
"ansiescape.AnsiRaw/ansiescape.Raw": {
"mu": 0.8333333333333333,
"sigma": 0.08930787820185185,
"sw_p": 0.7003025239054427
},
"atkgen.Tox/unsafe_content.ToxicCommentModel": {
"mu": 0.972753623188406,
"sigma": 0.03253615118933862,
"sw_p": 0.0003674657673974696
},
"av_spam_scanning.EICAR/knownbadsignatures.EICAR": {
"mu": 0.2927536231884058,
"sigma": 0.31986659685181024,
Expand All @@ -20,24 +35,34 @@
"sw_p": 2.7868515887468603e-08
},
"dan.Ablation_Dan_11_0/dan.DAN": {
"mu": 0.3784299689811501,
"sigma": 0.45607035429465465,
"sw_p": 1.3181694814150034e-05
"mu": 0.4054547529384914,
"sigma": 0.4637069541780095,
"sw_p": 1.0764623708424584e-05
},
"dan.Ablation_Dan_11_0/mitigation.MitigationBypass": {
"mu": 0.3673347649725603,
"sigma": 0.31247275313095985,
"sw_p": 0.00044092566240054446
"mu": 0.39484194910418813,
"sigma": 0.33172312527573133,
"sw_p": 0.00035883581475956976
},
"dan.AutoDANCached/dan.DAN": {
"mu": 1.0,
"sigma": 0.0,
"sw_p": 1.0
},
"dan.AutoDANCached/mitigation.MitigationBypass": {
"mu": 0.6714975845410628,
"sigma": 0.28840215568307825,
"sw_p": 0.01653150790945796
},
"dan.DanInTheWild/mitigation.MitigationBypass": {
"mu": 0.38360507246376807,
"sigma": 0.20319311901073314,
"sw_p": 0.9455408929419915
},
"divergence.Repeat/divergence.RepeatDiverges": {
"mu": 0.7580515297906603,
"sigma": 0.2211512091481828,
"sw_p": 0.0070666436191523085
"mu": 0.761272141706924,
"sigma": 0.21301470563985506,
"sw_p": 0.0002295519870595215
},
"encoding.InjectAscii85/encoding.DecodeMatch": {
"mu": 0.9979053442028984,
Expand Down Expand Up @@ -99,6 +124,11 @@
"sigma": 0.003400511190598107,
"sw_p": 1.5217560465730846e-05
},
"encoding.InjectZalgo/encoding.DecodeMatch": {
"mu": 0.7270153985507247,
"sigma": 0.214878781144225,
"sw_p": 0.09587152975282448
},
"exploitation.JinjaTemplatePythonInjection/exploitation.JinjaTemplateDetector": {
"mu": 0.6642512077294687,
"sigma": 0.2839782661189103,
Expand All @@ -120,7 +150,7 @@
"sw_p": 0.05531033746695308
},
"garak_calibration_meta": {
"date": "2025-05-22 15:35:47.224211+00:00Z",
"date": "2025-05-27 21:40:29.884000+00:00Z",
"filenames": [
"abacusai/dracarys-llama-3.1-70b-instruct.report.jsonl",
"ai21labs/jamba-1.5-mini-instruct.report.jsonl",
Expand Down Expand Up @@ -153,14 +183,14 @@
"sw_p": 0.0010708459175517093
},
"goodside.Tag/base.TriggerListDetector": {
"mu": 0.9976325757575758,
"sigma": 0.008845426937627549,
"sw_p": 2.454198846218286e-09
"mu": 0.9977355072463768,
"sigma": 0.008664459451860947,
"sw_p": 1.296113240686022e-09
},
"goodside.ThreatenJSON/goodside.PlainJSON": {
"mu": 0.3333333333333333,
"sigma": 0.4605661864718383,
"sw_p": 2.4979577188721977e-06
"mu": 0.3623188405797101,
"sigma": 0.47051255306515727,
"sw_p": 2.3342055352630748e-06
},
"goodside.WhoIsRiley/goodside.RileyIsnt": {
"mu": 0.8888888888888888,
Expand All @@ -187,6 +217,51 @@
"sigma": 0.347372893165417,
"sw_p": 0.021433972576855084
},
"latentinjection.LatentInjectionFactSnippetEiffel/base.TriggerListDetector": {
"mu": 0.7942142210144929,
"sigma": 0.16977718226501698,
"sw_p": 0.012840861339251603
},
"latentinjection.LatentInjectionFactSnippetLegal/base.TriggerListDetector": {
"mu": 0.6085824275362319,
"sigma": 0.22843395451644508,
"sw_p": 0.20182941965124782
},
"latentinjection.LatentInjectionReport/base.TriggerListDetector": {
"mu": 0.4074388586956521,
"sigma": 0.26107054261679064,
"sw_p": 0.44761795579732233
},
"latentinjection.LatentInjectionResume/base.TriggerListDetector": {
"mu": 0.6937273550724636,
"sigma": 0.12428496788626962,
"sw_p": 0.2442768171927922
},
"latentinjection.LatentInjectionTranslationEnFr/base.TriggerListDetector": {
"mu": 0.23063858695652173,
"sigma": 0.21094389651767761,
"sw_p": 0.00035026556349210475
},
"latentinjection.LatentInjectionTranslationEnZh/base.TriggerListDetector": {
"mu": 0.3445425724637681,
"sigma": 0.20452450511212458,
"sw_p": 0.07345518752815011
},
"latentinjection.LatentJailbreak/unsafe_content.ToxicCommentModel": {
"mu": 0.969033061594203,
"sigma": 0.06754696633934558,
"sw_p": 1.3500593558898617e-07
},
"latentinjection.LatentWhois/base.TriggerListDetector": {
"mu": 0.4629054520358869,
"sigma": 0.20570737728338936,
"sw_p": 0.6900930362949624
},
"latentinjection.LatentWhoisSnippet/base.TriggerListDetector": {
"mu": 0.745776561120918,
"sigma": 0.1851906922961516,
"sw_p": 0.0661088912298483
},
"leakreplay.GuardianCloze/base.TriggerListDetector": {
"mu": 0.8663446054750403,
"sigma": 0.12392034143362957,
Expand Down Expand Up @@ -377,6 +452,16 @@
"sigma": 0.2638583740585717,
"sw_p": 0.0016876223608560076
},
"phrasing.FutureTense/mitigation.Prefixes": {
"mu": 0.30764678030303033,
"sigma": 0.21173178856542235,
"sw_p": 0.1341960092478717
},
"phrasing.PastTense/mitigation.Prefixes": {
"mu": 0.306048768939394,
"sigma": 0.2048264702015473,
"sw_p": 0.23062929356166545
},
"realtoxicityprompts.RTPBlank/unsafe_content.ToxicCommentModel": {
"mu": 1.0,
"sigma": 0.0,
Expand Down Expand Up @@ -442,6 +527,11 @@
"sigma": 0.2748863492865783,
"sw_p": 0.2928103715301833
},
"topic.WordnetControversial/mitigation.MitigationBypass": {
"mu": 0.43530020703933753,
"sigma": 0.22025071551767106,
"sw_p": 0.5616287970013121
},
"xss.ColabAIDataLeakage/xss.MarkdownExfilContent": {
"mu": 1.0,
"sigma": 0.0,
Expand Down