feifeinoban committed on
Commit
1e848b8
·
1 Parent(s): c3c15e0

Fix image path for Gradio rendering

Browse files
Files changed (1) hide show
  1. index.html +374 -292
index.html CHANGED
@@ -3,28 +3,170 @@
3
  <head>
4
  <meta charset="utf-8">
5
  <meta name="description"
6
- content="Deformable Neural Radiance Fields creates free-viewpoint portraits (nerfies) from casually captured videos.">
7
- <meta name="keywords" content="Nerfies, D-NeRF, NeRF">
8
  <meta name="viewport" content="width=device-width, initial-scale=1">
9
- <title>Nerfies: Deformable Neural Radiance Fields</title>
10
 
11
  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
12
  rel="stylesheet">
13
 
14
- <link rel="stylesheet" href="./static/css/bulma.min.css">
15
- <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
16
- <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
17
- <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
18
  <link rel="stylesheet"
19
  href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
20
- <link rel="stylesheet" href="./static/css/index.css">
21
- <link rel="icon" href="./static/images/favicon.svg">
22
-
23
- <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
24
- <script defer src="./static/js/fontawesome.all.min.js"></script>
25
- <script src="./static/js/bulma-carousel.min.js"></script>
26
- <script src="./static/js/bulma-slider.min.js"></script>
27
- <script src="./static/js/index.js"></script>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  </head>
29
  <body>
30
 
@@ -33,39 +175,29 @@
33
  <div class="container is-max-desktop">
34
  <div class="columns is-centered">
35
  <div class="column has-text-centered">
36
- <h1 class="title is-1 publication-title">Nerfies: Deformable Neural Radiance Fields</h1>
37
  <div class="is-size-5 publication-authors">
38
  <span class="author-block">
39
- <a href="https://keunhong.com" target="_blank">Keunhong Park</a><sup>1</sup>,</span>
40
- <span class="author-block">
41
- <a href="https://utkarshsinha.com" target="_blank">Utkarsh Sinha</a><sup>2</sup>,</span>
42
- <span class="author-block">
43
- <a href="https://jonbarron.info" target="_blank">Jonathan T. Barron</a><sup>2</sup>,
44
- </span>
45
  <span class="author-block">
46
- <a href="http://sofienbouaziz.com" target="_blank">Sofien Bouaziz</a><sup>2</sup>,
47
- </span>
48
- <span class="author-block">
49
- <a href="https://www.danbgoldman.com" target="_blank">Dan B Goldman</a><sup>2</sup>,
50
- </span>
51
  <span class="author-block">
52
- <a href="https://homes.cs.washington.edu/~seitz/" target="_blank">Steven M. Seitz</a><sup>1,2</sup>,
53
  </span>
54
  <span class="author-block">
55
- <a href="http://www.ricardomartinbrualla.com" target="_blank">Ricardo Martin-Brualla</a><sup>2</sup>
56
  </span>
57
  </div>
58
 
59
  <div class="is-size-5 publication-authors">
60
- <span class="author-block"><sup>1</sup>University of Washington,</span>
61
- <span class="author-block"><sup>2</sup>Google Research</span>
62
  </div>
63
 
64
  <div class="column has-text-centered">
65
  <div class="publication-links">
66
  <!-- PDF Link. -->
67
  <span class="link-block">
68
- <a href="https://arxiv.org/pdf/2011.12948" target="_blank"
69
  class="external-link button is-normal is-rounded is-dark">
70
  <span class="icon">
71
  <i class="fas fa-file-pdf"></i>
@@ -74,7 +206,7 @@
74
  </a>
75
  </span>
76
  <span class="link-block">
77
- <a href="https://arxiv.org/abs/2011.12948" target="_blank"
78
  class="external-link button is-normal is-rounded is-dark">
79
  <span class="icon">
80
  <i class="ai ai-arxiv"></i>
@@ -82,19 +214,9 @@
82
  <span>arXiv</span>
83
  </a>
84
  </span>
85
- <!-- Video Link. -->
86
- <span class="link-block">
87
- <a href="https://www.youtube.com/watch?v=MrKrnHhk8IA" target="_blank"
88
- class="external-link button is-normal is-rounded is-dark">
89
- <span class="icon">
90
- <i class="fab fa-youtube"></i>
91
- </span>
92
- <span>Video</span>
93
- </a>
94
- </span>
95
  <!-- Code Link. -->
96
  <span class="link-block">
97
- <a href="https://github.com/google/nerfies" target="_blank"
98
  class="external-link button is-normal is-rounded is-dark">
99
  <span class="icon">
100
  <i class="fab fa-github"></i>
@@ -104,15 +226,15 @@
104
  </span>
105
  <!-- Dataset Link. -->
106
  <span class="link-block">
107
- <a href="https://github.com/google/nerfies/releases/tag/0.1" target="_blank"
108
  class="external-link button is-normal is-rounded is-dark">
109
  <span class="icon">
110
  <i class="far fa-images"></i>
111
  </span>
112
- <span>Data</span>
113
  </a>
 
114
  </div>
115
-
116
  </div>
117
  </div>
118
  </div>
@@ -122,314 +244,274 @@
122
 
123
  <section class="hero teaser">
124
  <div class="container is-max-desktop">
125
- <div class="hero-body">
126
- <video id="teaser" autoplay muted loop playsinline height="100%">
127
- <source src="./static/videos/teaser.mp4"
128
- type="video/mp4">
129
- </video>
130
- <h2 class="subtitle has-text-centered">
131
- <span class="dnerf">Nerfies</span> turns selfie videos from your phone into
132
- free-viewpoint
133
- portraits.
134
  </h2>
135
- </div>
136
- </div>
137
- </section>
138
-
139
-
140
- <section class="hero is-light is-small">
141
- <div class="hero-body">
142
- <div class="container">
143
- <div id="results-carousel" class="carousel results-carousel">
144
- <div class="item item-steve">
145
- <video poster="" id="steve" autoplay controls muted loop playsinline height="100%">
146
- <source src="./static/videos/steve.mp4"
147
- type="video/mp4">
148
- </video>
149
- </div>
150
- <div class="item item-chair-tp">
151
- <video poster="" id="chair-tp" autoplay controls muted loop playsinline height="100%">
152
- <source src="./static/videos/chair-tp.mp4"
153
- type="video/mp4">
154
- </video>
155
- </div>
156
- <div class="item item-shiba">
157
- <video poster="" id="shiba" autoplay controls muted loop playsinline height="100%">
158
- <source src="./static/videos/shiba.mp4"
159
- type="video/mp4">
160
- </video>
161
- </div>
162
- <div class="item item-fullbody">
163
- <video poster="" id="fullbody" autoplay controls muted loop playsinline height="100%">
164
- <source src="./static/videos/fullbody.mp4"
165
- type="video/mp4">
166
- </video>
167
- </div>
168
- <div class="item item-blueshirt">
169
- <video poster="" id="blueshirt" autoplay controls muted loop playsinline height="100%">
170
- <source src="./static/videos/blueshirt.mp4"
171
- type="video/mp4">
172
- </video>
173
- </div>
174
- <div class="item item-mask">
175
- <video poster="" id="mask" autoplay controls muted loop playsinline height="100%">
176
- <source src="./static/videos/mask.mp4"
177
- type="video/mp4">
178
- </video>
179
- </div>
180
- <div class="item item-coffee">
181
- <video poster="" id="coffee" autoplay controls muted loop playsinline height="100%">
182
- <source src="./static/videos/coffee.mp4"
183
- type="video/mp4">
184
- </video>
185
- </div>
186
- <div class="item item-toby">
187
- <video poster="" id="toby" autoplay controls muted loop playsinline height="100%">
188
- <source src="./static/videos/toby2.mp4"
189
- type="video/mp4">
190
- </video>
191
- </div>
192
  </div>
193
  </div>
194
  </div>
195
  </section>
196
 
197
-
198
  <section class="section">
199
  <div class="container is-max-desktop">
200
  <!-- Abstract. -->
201
  <div class="columns is-centered has-text-centered">
202
  <div class="column is-four-fifths">
203
  <h2 class="title is-3">Abstract</h2>
204
- <div class="content has-text-justified">
205
- <p>
206
- We present the first method capable of photorealistically reconstructing a non-rigidly
207
- deforming scene using photos/videos captured casually from mobile phones.
208
- </p>
209
- <p>
210
- Our approach augments neural radiance fields
211
- (NeRF) by optimizing an
212
- additional continuous volumetric deformation field that warps each observed point into a
213
- canonical 5D NeRF.
214
- We observe that these NeRF-like deformation fields are prone to local minima, and
215
- propose a coarse-to-fine optimization method for coordinate-based models that allows for
216
- more robust optimization.
217
- By adapting principles from geometry processing and physical simulation to NeRF-like
218
- models, we propose an elastic regularization of the deformation field that further
219
- improves robustness.
220
- </p>
221
- <p>
222
- We show that <span class="dnerf">Nerfies</span> can turn casually captured selfie
223
- photos/videos into deformable NeRF
224
- models that allow for photorealistic renderings of the subject from arbitrary
225
- viewpoints, which we dub <i>"nerfies"</i>. We evaluate our method by collecting data
226
- using a
227
- rig with two mobile phones that take time-synchronized photos, yielding train/validation
228
- images of the same pose at different viewpoints. We show that our method faithfully
229
- reconstructs non-rigidly deforming scenes and reproduces unseen views with high
230
- fidelity.
231
- </p>
232
  </div>
233
  </div>
234
  </div>
235
  <!--/ Abstract. -->
 
 
236
 
237
- <!-- Paper video. -->
238
- <div class="columns is-centered has-text-centered">
239
- <div class="column is-four-fifths">
240
- <h2 class="title is-3">Video</h2>
241
- <div class="publication-video">
242
- <iframe src="https://www.youtube.com/embed/MrKrnHhk8IA?rel=0&amp;showinfo=0"
243
- frameborder="0" allow="autoplay; encrypted-media" allowfullscreen></iframe>
244
  </div>
245
  </div>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
246
  </div>
247
- <!--/ Paper video. -->
248
  </div>
249
  </section>
250
 
251
-
252
  <section class="section">
253
  <div class="container is-max-desktop">
254
-
255
  <div class="columns is-centered">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
256
 
257
- <!-- Visual Effects. -->
258
- <div class="column">
259
- <div class="content">
260
- <h2 class="title is-3">Visual Effects</h2>
261
- <p>
262
- Using <i>nerfies</i> you can create fun visual effects. This Dolly zoom effect
263
- would be impossible without nerfies since it would require going through a wall.
264
- </p>
265
- <video id="dollyzoom" autoplay controls muted loop playsinline height="100%">
266
- <source src="./static/videos/dollyzoom-stacked.mp4"
267
- type="video/mp4">
268
- </video>
269
  </div>
270
- </div>
271
- <!--/ Visual Effects. -->
272
 
273
- <!-- Matting. -->
274
- <div class="column">
275
- <h2 class="title is-3">Matting</h2>
276
- <div class="columns is-centered">
277
- <div class="column content">
278
- <p>
279
- As a byproduct of our method, we can also solve the matting problem by ignoring
280
- samples that fall outside of a bounding box during rendering.
281
- </p>
282
- <video id="matting-video" controls playsinline height="100%">
283
- <source src="./static/videos/matting.mp4"
284
- type="video/mp4">
285
- </video>
286
  </div>
 
287
 
 
 
 
 
 
 
 
 
 
288
  </div>
289
  </div>
290
  </div>
291
- <!--/ Matting. -->
 
292
 
293
- <!-- Animation. -->
 
294
  <div class="columns is-centered">
295
- <div class="column is-full-width">
296
- <h2 class="title is-3">Animation</h2>
297
-
298
- <!-- Interpolating. -->
299
- <h3 class="title is-4">Interpolating states</h3>
300
- <div class="content has-text-justified">
301
- <p>
302
- We can also animate the scene by interpolating the deformation latent codes of two input
303
- frames. Use the slider here to linearly interpolate between the left frame and the right
304
- frame.
305
- </p>
306
  </div>
307
- <div class="columns is-vcentered interpolation-panel">
308
- <div class="column is-3 has-text-centered">
309
- <img src="./static/images/interpolate_start.jpg"
310
- class="interpolation-image"
311
- alt="Interpolate start reference image."/>
312
- <p>Start Frame</p>
313
- </div>
314
- <div class="column interpolation-video-column">
315
- <div id="interpolation-image-wrapper">
316
- Loading...
317
- </div>
318
- <input class="slider is-fullwidth is-large is-info"
319
- id="interpolation-slider"
320
- step="1" min="0" max="100" value="0" type="range">
321
- </div>
322
- <div class="column is-3 has-text-centered">
323
- <img src="./static/images/interpolate_end.jpg"
324
- class="interpolation-image"
325
- alt="Interpolation end reference image."/>
326
- <p class="is-bold">End Frame</p>
327
- </div>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
328
  </div>
329
- <br/>
330
- <!--/ Interpolating. -->
331
 
332
- <!-- Re-rendering. -->
333
- <h3 class="title is-4">Re-rendering the input video</h3>
334
- <div class="content has-text-justified">
335
- <p>
336
- Using <span class="dnerf">Nerfies</span>, you can re-render a video from a novel
337
- viewpoint such as a stabilized camera by playing back the training deformations.
338
  </p>
339
  </div>
340
- <div class="content has-text-centered">
341
- <video id="replay-video"
342
- controls
343
- muted
344
- preload
345
- playsinline
346
- width="75%">
347
- <source src="./static/videos/replay.mp4"
348
- type="video/mp4">
349
- </video>
350
- </div>
351
- <!--/ Re-rendering. -->
352
-
353
  </div>
354
  </div>
355
- <!--/ Animation. -->
356
-
357
 
358
- <!-- Concurrent Work. -->
 
359
  <div class="columns is-centered">
360
- <div class="column is-full-width">
361
- <h2 class="title is-3">Related Links</h2>
362
-
363
- <div class="content has-text-justified">
364
- <p>
365
- There's a lot of excellent work that was introduced around the same time as ours.
366
- </p>
367
- <p>
368
- <a href="https://arxiv.org/abs/2104.09125" target="_blank">Progressive Encoding for Neural Optimization</a> introduces an idea similar to our windowed position encoding for coarse-to-fine optimization.
369
- </p>
370
- <p>
371
- <a href="https://www.albertpumarola.com/research/D-NeRF/index.html" target="_blank">D-NeRF</a> and <a href="https://gvv.mpi-inf.mpg.de/projects/nonrigid_nerf/" target="_blank">NR-NeRF</a>
372
- both use deformation fields to model non-rigid scenes.
373
- </p>
374
- <p>
375
- Some works model videos with a NeRF by directly modulating the density, such as <a href="https://video-nerf.github.io/" target="_blank">Video-NeRF</a>, <a href="https://www.cs.cornell.edu/~zl548/NSFF/" target="_blank">NSFF</a>, and <a href="https://neural-3d-video.github.io/" target="_blank">DyNeRF</a>
376
- </p>
377
- <p>
378
- There are probably many more by the time you are reading this. Check out <a href="https://dellaert.github.io/NeRF/" target="_blank">Frank Dellart's survey on recent NeRF papers</a>, and <a href="https://github.com/yenchenlin/awesome-NeRF" target="_blank">Yen-Chen Lin's curated list of NeRF papers</a>.
379
- </p>
380
  </div>
381
  </div>
382
  </div>
383
- <!--/ Concurrent Work. -->
384
-
385
  </div>
386
  </section>
387
 
388
-
389
  <section class="section" id="BibTeX">
390
  <div class="container is-max-desktop content">
391
  <h2 class="title">BibTeX</h2>
392
- <pre><code>@article{park2021nerfies,
393
- author = {Park, Keunhong and Sinha, Utkarsh and Barron, Jonathan T. and Bouaziz, Sofien and Goldman, Dan B and Seitz, Steven M. and Martin-Brualla, Ricardo},
394
- title = {Nerfies: Deformable Neural Radiance Fields},
395
- journal = {ICCV},
396
- year = {2021},
397
  }</code></pre>
398
  </div>
399
  </section>
400
 
401
-
402
  <footer class="footer">
403
  <div class="container">
404
  <div class="content has-text-centered">
405
- <a class="icon-link" target="_blank"
406
- href="./static/videos/nerfies_paper.pdf">
407
- <i class="fas fa-file-pdf"></i>
408
- </a>
409
- <a class="icon-link" href="https://github.com/keunhong" target="_blank" class="external-link" disabled>
410
- <i class="fab fa-github"></i>
411
- </a>
412
- </div>
413
- <div class="columns is-centered">
414
- <div class="column is-8">
415
- <div class="content">
416
- <p>
417
- This website is licensed under a <a rel="license" target="_blank"
418
- href="http://creativecommons.org/licenses/by-sa/4.0/">Creative
419
- Commons Attribution-ShareAlike 4.0 International License</a>.
420
- </p>
421
- <p>
422
- This means you are free to borrow the <a target="_blank"
423
- href="https://github.com/nerfies/nerfies.github.io">source code</a> of this website,
424
- we just ask that you link back to this page in the footer.
425
- Please remember to remove the analytics code included in the header of the website which
426
- you do not want on your website.
427
- </p>
428
- </div>
429
- </div>
430
  </div>
431
  </div>
432
  </footer>
433
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
434
  </body>
435
- </html>
 
3
  <head>
4
  <meta charset="utf-8">
5
  <meta name="description"
6
+ content="Shell: A Metacognition-Driven Safety Framework for Domain-Specific LLMs">
7
+ <meta name="keywords" content="LLM Safety, Metacognition, AI Alignment, Activation Steering">
8
  <meta name="viewport" content="width=device-width, initial-scale=1">
9
+ <title>Shell: Metacognition-Driven Safety for Domain-Specific LLMs</title>
10
 
11
  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
12
  rel="stylesheet">
13
 
14
+ <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/bulma/0.9.3/css/bulma.min.css">
15
+ <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.0.0/css/all.min.css">
 
 
16
  <link rel="stylesheet"
17
  href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
18
+
19
+ <style> /* Page-local styles for the Shell project page, declared after the external stylesheets linked earlier in <head>. */
20
+ :root { /* Theme colours; consumed below through var(). */
21
+ --shell-primary: #3498db;
22
+ --shell-secondary: #9b59b6;
23
+ --shell-accent: #2ecc71;
24
+ }
25
+ /* Base typography for the whole page. */
26
+ body {
27
+ font-family: 'Google Sans', 'Noto Sans', sans-serif;
28
+ line-height: 1.6;
29
+ }
30
+ /* Gradient banner with white text. NOTE(review): this matches every element with the hero class, including the "hero is-light" section further down the page; confirm that is intended. */
31
+ .hero {
32
+ background: linear-gradient(135deg, var(--shell-primary), var(--shell-secondary));
33
+ color: white;
34
+ }
35
+ /* Paper title (the h1 in the header banner). */
36
+ .publication-title {
37
+ color: white;
38
+ margin-bottom: 1rem;
39
+ }
40
+ /* Author row and affiliation row share this class. */
41
+ .publication-authors {
42
+ margin-bottom: 1rem;
43
+ }
44
+ /* One author or affiliation entry; inline-block with horizontal spacing. */
45
+ .author-block {
46
+ display: inline-block;
47
+ margin: 0 0.5rem;
48
+ }
49
+ /* Wrapper around the PDF / arXiv / Code / Dataset buttons. */
50
+ .publication-links {
51
+ margin-top: 1.5rem;
52
+ }
53
+ /* One button slot inside .publication-links. */
54
+ .link-block {
55
+ display: inline-block;
56
+ margin: 0 0.5rem;
57
+ }
58
+ /* Animate transform changes so the hover lift below is smooth. */
59
+ .external-link {
60
+ transition: transform 0.2s;
61
+ }
62
+ /* Hover state: move the button up by 2px. */
63
+ .external-link:hover {
64
+ transform: translateY(-2px);
65
+ }
66
+ /* Vertical padding for the teaser banner section. */
67
+ .teaser {
68
+ padding: 4rem 0;
69
+ }
70
+ /* NOTE(review): no video element is visible inside .teaser in the markup shown in this diff; possibly a template leftover. Confirm before removing. */
71
+ .teaser video {
72
+ border-radius: 10px;
73
+ box-shadow: 0 10px 30px rgba(0,0,0,0.3);
74
+ }
75
+ /* Bold, primary-coloured inline highlight (used on a span in the teaser subtitle). */
76
+ .dnerf {
77
+ font-weight: bold;
78
+ color: var(--shell-primary);
79
+ }
80
+ /* NOTE(review): no element with this class is visible in the new markup shown in this diff; confirm whether it is still needed. */
81
+ .results-carousel {
82
+ margin: 2rem 0;
83
+ }
84
+ /* Padding for every element with the section class. */
85
+ .section {
86
+ padding: 4rem 1.5rem;
87
+ }
88
+ /* Headings nested inside a .content container: primary colour with a light underline. */
89
+ .content h2, .content h3 {
90
+ color: var(--shell-primary);
91
+ border-bottom: 2px solid #f5f5f5;
92
+ padding-bottom: 0.5rem;
93
+ margin-top: 2rem;
94
+ }
95
+ /* Card-style wrapper around each table; overflow hidden clips the table to the rounded corners. */
96
+ .table-container {
97
+ margin: 2rem 0;
98
+ box-shadow: 0 5px 15px rgba(0,0,0,0.1);
99
+ border-radius: 10px;
100
+ overflow: hidden;
101
+ }
102
+ /* Tables span the full width of their container. */
103
+ table {
104
+ width: 100%;
105
+ }
106
+ /* Header cells use the same gradient as .hero. */
107
+ table th {
108
+ background: linear-gradient(135deg, var(--shell-primary), var(--shell-secondary));
109
+ color: white;
110
+ font-weight: 600;
111
+ }
112
+ /* Pill-shaped label; applied to the feature links in the teaser. */
113
+ .badge {
114
+ display: inline-block;
115
+ padding: 0.5rem 1rem;
116
+ background: var(--shell-primary);
117
+ color: white;
118
+ border-radius: 20px;
119
+ margin: 0.25rem;
120
+ font-size: 0.9rem;
121
+ text-decoration: none;
122
+ }
123
+ /* Hover state: switch the pill to the secondary colour, text stays white. */
124
+ .badge:hover {
125
+ background: var(--shell-secondary);
126
+ color: white;
127
+ }
128
+ /* Light grey gradient panel with a primary-coloured left border, wrapping the abstract text. */
129
+ .abstract-box {
130
+ background: linear-gradient(135deg, #f8f9fa, #e9ecef);
131
+ padding: 2rem;
132
+ border-radius: 10px;
133
+ border-left: 5px solid var(--shell-primary);
134
+ margin: 2rem 0;
135
+ }
136
+ /* White card with an accent-coloured left border; one per numbered methodology step. */
137
+ .methodology-step {
138
+ margin: 2rem 0;
139
+ padding: 1.5rem;
140
+ border-radius: 10px;
141
+ background: white;
142
+ box-shadow: 0 5px 15px rgba(0,0,0,0.1);
143
+ border-left: 4px solid var(--shell-accent);
144
+ }
145
+ /* Centred gradient panel holding the headline result. */
146
+ .results-highlight {
147
+ text-align: center;
148
+ padding: 2rem;
149
+ background: linear-gradient(135deg, var(--shell-primary), var(--shell-secondary));
150
+ color: white;
151
+ border-radius: 10px;
152
+ margin: 2rem 0;
153
+ }
154
+ /* The large figure inside .results-highlight; display block puts it on its own line. */
155
+ .results-highlight .number {
156
+ font-size: 3rem;
157
+ font-weight: bold;
158
+ display: block;
159
+ }
160
+ /* Architecture figure: fills the column up to 800px and is centred by the auto side margins. */
161
+ .architecture-image {
162
+ width: 100%;
163
+ max-width: 800px;
164
+ display: block;
165
+ margin: 2rem auto;
166
+ border-radius: 10px;
167
+ box-shadow: 0 10px 30px rgba(0,0,0,0.2);
168
+ }
169
+ </style>
170
  </head>
171
  <body>
172
 
 
175
  <div class="container is-max-desktop">
176
  <div class="columns is-centered">
177
  <div class="column has-text-centered">
178
+ <h1 class="title is-1 publication-title">🐚 Shell: Metacognition-Driven Safety Framework for Domain-Specific LLMs</h1>
179
  <div class="is-size-5 publication-authors">
180
  <span class="author-block">
181
+ <a href="#" target="_blank">Wen Wu</a><sup>1</sup>,</span>
 
 
 
 
 
182
  <span class="author-block">
183
+ <a href="#" target="_blank">Zhenyu Ying</a><sup>1</sup>,</span>
 
 
 
 
184
  <span class="author-block">
185
+ <a href="#" target="_blank">Liang He</a><sup>1</sup>,
186
  </span>
187
  <span class="author-block">
188
+ <a href="#" target="_blank">Shell Team</a><sup>1</sup>
189
  </span>
190
  </div>
191
 
192
  <div class="is-size-5 publication-authors">
193
+ <span class="author-block"><sup>1</sup>Anonymous Submission</span>
 
194
  </div>
195
 
196
  <div class="column has-text-centered">
197
  <div class="publication-links">
198
  <!-- PDF Link. -->
199
  <span class="link-block">
200
+ <a href="#" target="_blank"
201
  class="external-link button is-normal is-rounded is-dark">
202
  <span class="icon">
203
  <i class="fas fa-file-pdf"></i>
 
206
  </a>
207
  </span>
208
  <span class="link-block">
209
+ <a href="#" target="_blank"
210
  class="external-link button is-normal is-rounded is-dark">
211
  <span class="icon">
212
  <i class="ai ai-arxiv"></i>
 
214
  <span>arXiv</span>
215
  </a>
216
  </span>
 
 
 
 
 
 
 
 
 
 
217
  <!-- Code Link. -->
218
  <span class="link-block">
219
+ <a href="#" target="_blank"
220
  class="external-link button is-normal is-rounded is-dark">
221
  <span class="icon">
222
  <i class="fab fa-github"></i>
 
226
  </span>
227
  <!-- Dataset Link. -->
228
  <span class="link-block">
229
+ <a href="#" target="_blank"
230
  class="external-link button is-normal is-rounded is-dark">
231
  <span class="icon">
232
  <i class="far fa-images"></i>
233
  </span>
234
+ <span>Dataset</span>
235
  </a>
236
+ </span>
237
  </div>
 
238
  </div>
239
  </div>
240
  </div>
 
244
 
245
  <section class="hero teaser">
246
  <div class="container is-max-desktop">
247
+ <div class="hero-body has-text-centered">
248
+ <h2 class="subtitle is-3">
249
+ Uncover and mitigate <span class="dnerf">implicit value risks</span> in education, finance, management—and beyond
 
 
 
 
 
 
250
  </h2>
251
+ <div class="content">
252
+ <a href="#" class="badge">🔒 Model-agnostic</a>
253
+ <a href="#" class="badge">🧠 Self-evolving rules</a>
254
+ <a href="#" class="badge">⚡ Activation steering</a>
255
+ <a href="#" class="badge">📉 90%+ jailbreak reduction</a>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
256
  </div>
257
  </div>
258
  </div>
259
  </section>
260
 
 
261
  <section class="section">
262
  <div class="container is-max-desktop">
263
  <!-- Abstract. -->
264
  <div class="columns is-centered has-text-centered">
265
  <div class="column is-four-fifths">
266
  <h2 class="title is-3">Abstract</h2>
267
+ <div class="abstract-box">
268
+ <div class="content has-text-justified">
269
+ <p>
270
+ While current LLM safety methods focus on explicit harms (e.g., hate speech, violence), they often miss <strong>domain-specific implicit risks</strong>—such as encouraging academic dishonesty in education, promoting reckless trading in finance, or normalizing toxic workplace culture in management.
271
+ </p>
272
+ <p>
273
+ We introduce <strong>Shell</strong>, a metacognition-driven self-evolution framework that enables LLMs to self-diagnose value misalignments via perspective-taking and consequence simulation, builds a hybrid rule system with expert-defined static trees and self-evolved dynamic graphs, and enforces rules at inference time via activation steering.
274
+ </p>
275
+ <p>
276
+ Evaluated on 9,000 risk queries across <strong>education, finance, and management</strong>, Shell reduces average jailbreak rates by <strong>&gt;90%</strong> on models including GPT-5, Qwen3, and Llama 3.1.
277
+ </p>
278
+ </div>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
279
  </div>
280
  </div>
281
  </div>
282
  <!--/ Abstract. -->
283
+ </div>
284
+ </section>
285
 
286
+ <section class="hero is-light is-small">
287
+ <div class="hero-body">
288
+ <div class="container">
289
+ <div class="columns is-centered">
290
+ <div class="column is-8 has-text-centered">
291
+ <h2 class="title is-3">Core Challenges: Implicit Risks Are Everywhere</h2>
 
292
  </div>
293
  </div>
294
+ <div class="table-container">
295
+ <table class="table is-striped is-fullwidth">
296
+ <thead>
297
+ <tr>
298
+ <th>Domain</th>
299
+ <th>Example Implicit Risk</th>
300
+ <th>Harmful Consequence</th>
301
+ </tr>
302
+ </thead>
303
+ <tbody>
304
+ <tr>
305
+ <td><strong>Education</strong></td>
306
+ <td>Suggesting clever comebacks that escalate bullying</td>
307
+ <td>Deteriorates peer relationships</td>
308
+ </tr>
309
+ <tr>
310
+ <td></td>
311
+ <td>Framing "sacrificing sleep for grades" as admirable</td>
312
+ <td>Promotes unhealthy competition</td>
313
+ </tr>
314
+ <tr>
315
+ <td></td>
316
+ <td>Teaching how to "rephrase copied essays"</td>
317
+ <td>Undermines academic integrity</td>
318
+ </tr>
319
+ <tr>
320
+ <td><strong>Finance</strong></td>
321
+ <td>Encouraging high-leverage speculation as "smart risk"</td>
322
+ <td>Normalizes financial recklessness</td>
323
+ </tr>
324
+ <tr>
325
+ <td><strong>Management</strong></td>
326
+ <td>Praising "always-on" culture as "dedication"</td>
327
+ <td>Reinforces burnout and poor work-life balance</td>
328
+ </tr>
329
+ </tbody>
330
+ </table>
331
+ </div>
332
+ <div class="has-text-centered">
333
+ <p class="is-italic">
334
+ 💡 These risks are <strong>not jailbreaks</strong> in the traditional sense—they appear benign but subtly erode domain-specific values.
335
+ </p>
336
+ </div>
337
  </div>
 
338
  </div>
339
  </section>
340
 
 
341
  <section class="section">
342
  <div class="container is-max-desktop">
 
343
  <div class="columns is-centered">
344
+ <div class="column is-four-fifths">
345
+ <h2 class="title is-3">Methodology: The MENTOR Architecture</h2>
346
+
347
+ <div class="methodology-step">
348
+ <h3 class="title is-4">1. Metacognitive Self-Assessment</h3>
349
+ <div class="content">
350
+ <p>LLMs evaluate their own outputs using:</p>
351
+ <ul>
352
+ <li><strong>Perspective-taking</strong>: "How would a teacher/parent/regulator view this?"</li>
353
+ <li><strong>Consequential thinking</strong>: "What real-world harm could this cause?"</li>
354
+ <li><strong>Normative introspection</strong>: "Does this align with core domain ethics?"</li>
355
+ </ul>
356
+ <p>This replaces labor-intensive human labeling with <strong>autonomous, human-aligned reflection</strong>.</p>
357
+ </div>
358
+ </div>
359
 
360
+ <div class="methodology-step">
361
+ <h3 class="title is-4">2. Rule Evolution Cycle (REC)</h3>
362
+ <div class="content">
363
+ <ul>
364
+ <li><strong>Static Rule Tree</strong>: Expert-curated, hierarchical rules (e.g., <code>Education → Academic Integrity → No Plagiarism</code>).</li>
365
+ <li><strong>Dynamic Rule Graph</strong>: Automatically generated from successful self-corrections (e.g., <code>&lt;risk: essay outsourcing&gt; → &lt;rule: teach outlining instead&gt;</code>).</li>
366
+ <li>Rules evolve via <strong>dual clustering</strong> (by risk type &amp; mitigation strategy), enabling precise retrieval.</li>
367
+ </ul>
368
+ </div>
 
 
 
369
  </div>
 
 
370
 
371
+ <div class="methodology-step">
372
+ <h3 class="title is-4">3. Robust Rule Vectors (RV) via Activation Steering</h3>
373
+ <div class="content">
374
+ <ul>
375
+ <li>Generate <strong>steering vectors</strong> from contrasting compliant vs. non-compliant responses.</li>
376
+ <li>At inference, <strong>add vectors to internal activations</strong> (e.g., Layer 18 of Llama 3.1) to guide behavior.</li>
377
+ <li><strong>No fine-tuning needed</strong>—works on closed-source models like GPT-5.</li>
378
+ </ul>
 
 
 
 
 
379
  </div>
380
+ </div>
381
 
382
+ <!-- Architecture Image -->
383
+ <img src="https://huggingface.co/spaces/feifeinoban/shell/resolve/main/assets/mentor_arch.png"
384
+ alt="MENTOR Architecture"
385
+ class="architecture-image">
386
+
387
+ <div class="has-text-centered">
388
+ <p class="is-italic">
389
+ Figure: The MENTOR framework. Shell implements this full pipeline.
390
+ </p>
391
  </div>
392
  </div>
393
  </div>
394
+ </div>
395
+ </section>
396
 
397
+ <section class="section">
398
+ <div class="container is-max-desktop">
399
  <div class="columns is-centered">
400
+ <div class="column is-four-fifths">
401
+ <h2 class="title is-3">Results: Strong, Efficient, Generalizable</h2>
402
+
403
+ <div class="results-highlight">
404
+ <span class="number">&gt;90%</span>
405
+ <span class="subtitle">Average Jailbreak Rate Reduction</span>
 
 
 
 
 
406
  </div>
407
+
408
+ <h3 class="title is-4">Jailbreak Rate Reduction (3,000 queries per domain)</h3>
409
+
410
+ <div class="table-container">
411
+ <table class="table is-striped is-fullwidth">
412
+ <thead>
413
+ <tr>
414
+ <th>Model</th>
415
+ <th>Original</th>
416
+ <th>+ Shell (Rules + MetaLoop + RV)</th>
417
+ <th>Reduction</th>
418
+ </tr>
419
+ </thead>
420
+ <tbody>
421
+ <tr>
422
+ <td><strong>GPT-5</strong></td>
423
+ <td>38.39%</td>
424
+ <td><strong>0.77%</strong></td>
425
+ <td><strong>98.0%</strong></td>
426
+ </tr>
427
+ <tr>
428
+ <td><strong>Qwen3-235B</strong></td>
429
+ <td>56.33%</td>
430
+ <td><strong>3.13%</strong></td>
431
+ <td><strong>94.4%</strong></td>
432
+ </tr>
433
+ <tr>
434
+ <td><strong>GPT-4o</strong></td>
435
+ <td>58.81%</td>
436
+ <td><strong>6.43%</strong></td>
437
+ <td><strong>89.1%</strong></td>
438
+ </tr>
439
+ <tr>
440
+ <td><strong>Llama 3.1-8B</strong></td>
441
+ <td>67.45%</td>
442
+ <td><strong>31.39%</strong></td>
443
+ <td><strong>53.5%</strong></td>
444
+ </tr>
445
+ </tbody>
446
+ </table>
447
  </div>
 
 
448
 
449
+ <div class="has-text-centered">
450
+ <p class="is-italic">
451
+ Human evaluators prefer Shell-augmented responses <strong>68% of the time</strong> for safety, appropriateness, and usefulness.
 
 
 
452
  </p>
453
  </div>
 
 
 
 
 
 
 
 
 
 
 
 
 
454
  </div>
455
  </div>
456
+ </div>
457
+ </section>
458
 
459
+ <section class="section">
460
+ <div class="container is-max-desktop">
461
  <div class="columns is-centered">
462
+ <div class="column is-four-fifths">
463
+ <h2 class="title is-3">Try It / Use It</h2>
464
+
465
+ <div class="content">
466
+ <h3 class="title is-4">For Researchers</h3>
467
+ <ul>
468
+ <li><strong>Dataset</strong>: 9,000 implicit-risk queries across 3 domains → [HF Dataset Link]</li>
469
+ <li><strong>Code</strong>: Full implementation of REC + RV → [GitHub Link] (coming soon)</li>
470
+ </ul>
 
 
 
 
 
 
 
 
 
 
 
471
  </div>
472
  </div>
473
  </div>
 
 
474
  </div>
475
  </section>
476
 
 
477
  <section class="section" id="BibTeX">
478
  <div class="container is-max-desktop content">
479
  <h2 class="title">BibTeX</h2>
480
+ <pre><code>@article{shell2025,
481
+ title={Shell: A Metacognition-Driven Safety Framework for Domain-Specific LLMs},
482
+ author={Wu, Wen and Ying, Zhenyu and He, Liang and {Shell Team}},
483
+ journal={Anonymous Submission},
484
+ year={2025}
485
  }</code></pre>
486
  </div>
487
  </section>
488
 
 
489
  <footer class="footer">
490
  <div class="container">
491
  <div class="content has-text-centered">
492
+ <p>
493
+ This website is licensed under a <a rel="license" target="_blank"
494
+ href="http://creativecommons.org/licenses/by-sa/4.0/">Creative
495
+ Commons Attribution-ShareAlike 4.0 International License</a>.
496
+ </p>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
497
  </div>
498
  </div>
499
  </footer>
500
 
501
+ <script>
502
+ // Simple JavaScript for interactive elements if needed
503
+ document.addEventListener('DOMContentLoaded', function() {
504
+ // Add smooth scrolling for anchor links
505
+ document.querySelectorAll('a[href^="#"]').forEach(anchor => {
506
+ anchor.addEventListener('click', function (e) {
507
+ e.preventDefault();
508
+ document.querySelector(this.getAttribute('href')).scrollIntoView({
509
+ behavior: 'smooth'
510
+ });
511
+ });
512
+ });
513
+ });
514
+ </script>
515
+
516
  </body>
517
+ </html>