File size: 6,175 Bytes
bfc5ccd
 
 
 
 
 
 
 
1e56d6c
bfc5ccd
966103e
bfc5ccd
966103e
bfc5ccd
a747a13
bfc5ccd
425d6ee
bfc5ccd
 
 
425d6ee
bfc5ccd
425d6ee
bfc5ccd
5059791
bfc5ccd
5059791
bfc5ccd
5059791
bfc5ccd
425d6ee
bfc5ccd
425d6ee
 
 
 
 
 
 
 
 
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
64e08de
461ec0e
64e08de
bfc5ccd
dde3ca5
 
 
 
bfc5ccd
 
b681cf4
bfc5ccd
 
 
 
 
 
 
 
d2c8588
bfc5ccd
063249c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
@media screen and (min-width: 70em) { .main-content { max-width: 70rem; padding: 2rem 6rem; margin: 0 auto; font-size: 1.1rem; } }
@font-face { font-family: 'flexslider-icon'; src: url("../fonts/flexslider-icon.eot"); src: url("../fonts/flexslider-icon.eot?#iefix") format("embedded-opentype"), url("../fonts/flexslider-icon.woff") format("woff"), url("../fonts/flexslider-icon.ttf") format("truetype"), url("../fonts/flexslider-icon.svg#flexslider-icon") format("svg"); font-weight: normal; font-style: normal; }
header h1, header h2 { font-weight: normal; line-height: normal; }

header h2 { margin-top: .83em; }

.main-content p { text-align: justify; }

.jailbreak-intro-sec { width: 80%; margin: 1em auto; }

#refusal-loss-formula .formula { text-align: center; }

#refusal-loss-formula .formula-list { width: fit-content; margin: 0 auto; }

#refusal-loss-formula .formula-list a { display: inline-block; width: 250px; margin: 0 20px; padding: 8px 10px; text-align: center; background: #DDD; cursor: pointer; text-decoration: none; color: #333; border-radius: 10px; user-select: none; transition-duration: 0.3s; }

#jailbreak-demo .radio-group { margin-right: 5px; }

input[type='radio'] { visibility: hidden; display: none; }

#jailbreak-demo .radio-group .option-label { font-size: 1em; cursor: pointer; position: relative; padding: 0.1em 0.6em; border: 1px solid #999; background: #FFF; border-radius: 0.2em; transition: 0.2s; }

#jailbreak-demo .radio-group .options:checked ~ .option-label { color: #FFF; background: #777; }

#refusal-loss-formula .formula-list a:hover, #jailbreak-demo #defense-methods .defense:hover { background: #555; color: #FFF; }

#jailbreak-demo #defense-methods .options:checked ~ .defense { color: #FFF; background: #555; }

#jailbreak-demo #defense-methods .defense { display: inline-block; width: 60%; margin: 2% auto 8%; padding: 8px 10px; text-align: center; background: #DDD; cursor: pointer; text-decoration: none; color: #333; border-radius: 10px; user-select: none; transition-duration: 0.3s; }

#jailbreak-demo .legend { text-align: center; width: 70%; margin: 0 auto; }

#jailbreak-demo .figure-option { text-align: center; width: 70%; margin: 4% auto 0; /* Customize the label (the container) */ /* Hide the browser's default checkbox */ /* Create a custom checkbox */ /* On mouse-over, add a grey background color */ /* When the checkbox is checked, add a blue background */ /* Create the checkmark/indicator (hidden when not checked) */ /* Show the checkmark when checked */ /* Style the checkmark/indicator */ }
#jailbreak-demo .figure-option .container { display: block; position: relative; padding-left: 35px; margin-bottom: 12px; cursor: pointer; font-size: 22px; -webkit-user-select: none; -moz-user-select: none; -ms-user-select: none; user-select: none; }
#jailbreak-demo .figure-option .container input { position: absolute; opacity: 0; cursor: pointer; height: 0; width: 0; }
#jailbreak-demo .figure-option .checkmark { position: absolute; top: 4px; left: 8px; height: 25px; width: 25px; background-color: #eee; }
#jailbreak-demo .figure-option .container:hover input ~ .checkmark { background-color: #ccc; }
#jailbreak-demo .figure-option .container input:checked ~ .checkmark { background-color: #9b9bff; }
#jailbreak-demo .figure-option .checkmark:after { content: ""; position: absolute; display: none; }
#jailbreak-demo .figure-option .container input:checked ~ .checkmark:after { display: block; }
#jailbreak-demo .figure-option .container .checkmark:after { left: 9px; top: 5px; width: 5px; height: 10px; border: solid white; border-width: 0 3px 3px 0; -webkit-transform: rotate(45deg); -ms-transform: rotate(45deg); transform: rotate(45deg); }

#jailbreak-demo .figure { margin: 0 auto; display: block; }

#jailbreak-demo .figure #original { display: none; }

#jailbreak-demo .figure img { user-drag: none; -webkit-user-drag: none; user-select: none; -khtml-user-drag: none; -moz-user-drag: none; -o-user-drag: none; pointer-events: none; position: relative; left: 35px; }

#jailbreak-demo .figure-caption { width: 240px; text-align: center; display: block; margin: 0 auto; padding: 10px 0 0; font-size: .8em; }

#jailbreak-demo .figure-caption ul { padding-left: 0; }

#jailbreak-demo .figure-caption ul li { list-style: none; }

#jailbreak-demo .figure-caption .model-prediction { font-weight: bold; }

#jailbreak-demo .figure-caption .correct { color: #009926; }

#jailbreak-demo .figure-caption .wrong { color: #e31327; }

#jailbreak-demo .attack-success-rate { display: inline-block; width: 60%; margin: 2% auto 8%; padding: 8px 10px; text-align: center; text-decoration: none; background: #DDD; color: #333; border-radius: 10px; user-select: none; }
#jailbreak-demo .attack-success-rate .jailbreak-metric { font-size: 0.75em; display: block; }
#jailbreak-demo .attack-success-rate .attack-success-rate-value { font-size: 1.5em; font-family: "sans-serif"; color: #820000; }

#jailbreak-demo .benign-refusal-rate { display: inline-block; width: 60%; margin: 2% auto 8%; padding: 8px 10px; text-align: center; text-decoration: none; background: #DDD; color: #333; border-radius: 10px; user-select: none; }
#jailbreak-demo .benign-refusal-rate .jailbreak-metric { font-size: 0.75em; display: block; }
#jailbreak-demo .benign-refusal-rate .benign-refusal-rate-value { font-size: 1.5em; font-family: "sans-serif"; color: #820000; }

.warning-quote { padding: 15px; font-size: 0.8em; background-color: #f43636ba; color: white; margin-bottom: 15px; border-left: 5px solid #ff3030; transition-duration: 0.3s; }

.closebtn { margin-left: 15px; color: white; font-weight: bold; float: right; font-size: 6px; line-height: 20px; cursor: pointer; transition: 0.3s; }

/* When moving the mouse over the close button */
.closebtn:hover { color: black; }

.slider-container { display: block; margin-top: 1em; margin-bottom: 0.5em; float: left; }

.slider-label { width: 140px; float: left; line-height: 1; }

.slider-content { width: 450px; position: relative; float: right; }

#ppl-threshold, #gradient-norm-threshold { width: 3em; height: 1.6em; top: 50%; margin-top: -.8em; text-align: center; line-height: 1.6em; }