File size: 5,725 Bytes
bfc5ccd
 
 
 
 
 
 
 
1e56d6c
bfc5ccd
966103e
bfc5ccd
966103e
bfc5ccd
cb2376f
bfc5ccd
425d6ee
bfc5ccd
 
 
425d6ee
bfc5ccd
425d6ee
bfc5ccd
89dec80
bfc5ccd
89dec80
bfc5ccd
89dec80
bfc5ccd
425d6ee
bfc5ccd
425d6ee
 
 
 
 
 
 
 
 
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
425d6ee
bfc5ccd
64e08de
461ec0e
64e08de
bfc5ccd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
@media screen and (min-width: 70em) { .main-content { max-width: 70rem; padding: 2rem 6rem; margin: 0 auto; font-size: 1.1rem; } }
@font-face { font-family: 'flexslider-icon'; src: url("../fonts/flexslider-icon.eot"); src: url("../fonts/flexslider-icon.eot?#iefix") format("embedded-opentype"), url("../fonts/flexslider-icon.woff") format("woff"), url("../fonts/flexslider-icon.ttf") format("truetype"), url("../fonts/flexslider-icon.svg#flexslider-icon") format("svg"); font-weight: normal; font-style: normal; }
header h1, header h2 { font-weight: normal; line-height: normal; }

header h2 { margin-top: .83em; }

.main-content p { text-align: justify; }

.jailbreak-intro-sec { width: 80%; margin: 1em auto; }

#refusal-loss-formula .formula { text-align: center; }

#refusal-loss-formula .formula-list { width: fit-content; margin: 0 auto; }

#refusal-loss-formula .formula-list a { display: inline-block; width: 150px; margin: 0 20px; padding: 8px 10px; text-align: center; background: #DDD; cursor: pointer; text-decoration: none; color: #333; border-radius: 10px; user-select: none; transition-duration: 0.3s; }

#jailbreak-demo .radio-group { margin-right: 5px; }

input[type='radio'] { visibility: hidden; display: none; }

#jailbreak-demo .radio-group .option-label { font-size: 1em; cursor: pointer; position: relative; padding: 0.1em 0.6em; border: 1px solid #999; background: #FFF; border-radius: 0.2em; transition: 0.2s; }

#jailbreak-demo .radio-group .options:checked ~ .option-label { color: #FFF; background: #777; }

#refusal-loss-formula .formula-list a:hover, #jailbreak-demo #defense-methods .calibrate-tool:hover { background: #555; color: #FFF; }

#jailbreak-demo #defense-methods .options:checked ~ .calibrate-tool { color: #FFF; background: #555; }

#jailbreak-demo #defense-methods .calibrate-tool { display: inline-block; width: 60%; margin: 2% auto 8%; padding: 8px 10px; text-align: center; background: #DDD; cursor: pointer; text-decoration: none; color: #333; border-radius: 10px; user-select: none; transition-duration: 0.3s; }

#jailbreak-demo .legend { text-align: center; width: 70%; margin: 0 auto; }

#jailbreak-demo .figure-option { text-align: center; width: 70%; margin: 4% auto 0; /* Customize the label (the container) */ /* Hide the browser's default checkbox */ /* Create a custom checkbox */ /* On mouse-over, add a grey background color */ /* When the checkbox is checked, add a blue background */ /* Create the checkmark/indicator (hidden when not checked) */ /* Show the checkmark when checked */ /* Style the checkmark/indicator */ }
#jailbreak-demo .figure-option .container { display: block; position: relative; padding-left: 35px; margin-bottom: 12px; cursor: pointer; font-size: 22px; -webkit-user-select: none; -moz-user-select: none; -ms-user-select: none; user-select: none; }
#jailbreak-demo .figure-option .container input { position: absolute; opacity: 0; cursor: pointer; height: 0; width: 0; }
#jailbreak-demo .figure-option .checkmark { position: absolute; top: 4px; left: 8px; height: 25px; width: 25px; background-color: #eee; }
#jailbreak-demo .figure-option .container:hover input ~ .checkmark { background-color: #ccc; }
#jailbreak-demo .figure-option .container input:checked ~ .checkmark { background-color: #9b9bff; }
#jailbreak-demo .figure-option .checkmark:after { content: ""; position: absolute; display: none; }
#jailbreak-demo .figure-option .container input:checked ~ .checkmark:after { display: block; }
#jailbreak-demo .figure-option .container .checkmark:after { left: 9px; top: 5px; width: 5px; height: 10px; border: solid white; border-width: 0 3px 3px 0; -webkit-transform: rotate(45deg); -ms-transform: rotate(45deg); transform: rotate(45deg); }

#jailbreak-demo .figure { margin: 0 auto; display: block; }

#jailbreak-demo .figure #original { display: none; }

#jailbreak-demo .figure img { user-drag: none; -webkit-user-drag: none; user-select: none; -khtml-user-drag: none; -moz-user-drag: none; -o-user-drag: none; pointer-events: none; position: relative; left: 35px; }

#jailbreak-demo .figure-caption { width: 240px; text-align: center; display: block; margin: 0 auto; padding: 10px 0 0; font-size: .8em; }

#jailbreak-demo .figure-caption ul { padding-left: 0; }

#jailbreak-demo .figure-caption ul li { list-style: none; }

#jailbreak-demo .figure-caption .model-prediction { font-weight: bold; }

#jailbreak-demo .figure-caption .correct { color: #009926; }

#jailbreak-demo .figure-caption .wrong { color: #e31327; }

#jailbreak-demo .attack-success-rate { display: inline-block; width: 60%; margin: 2% auto 8%; padding: 8px 10px; text-align: center; text-decoration: none; background: #DDD; color: #333; border-radius: 10px; user-select: none; }
#jailbreak-demo .attack-success-rate .jailbreak-metric { font-size: 0.75em; display: block; }
#jailbreak-demo .attack-success-rate .attack-success-rate-value { font-size: 1.5em; font-family: "sans-serif"; color: #820000; }

.warning-quote { padding: 15px; font-size: 0.8em; background-color: #f43636ba; color: white; margin-bottom: 15px; border-left: 5px solid #ff3030; transition-duration: 0.3s; }

.closebtn { margin-left: 15px; color: white; font-weight: bold; float: right; font-size: 22px; line-height: 20px; cursor: pointer; transition: 0.3s; }

/* When moving the mouse over the close button */
.closebtn:hover { color: black; }

.slider-container { display: block; margin-top: 1em; margin-bottom: 0.5em; float: left; }

.slider-label { width: 140px; float: left; line-height: 1; }

.slider-content { width: 450px; position: relative; float: right; }

#bin-num, #temp-scale { width: 3em; height: 1.6em; top: 50%; margin-top: -.8em; text-align: center; line-height: 1.6em; }