Commit
·
af929b8
1
Parent(s):
c35e6e6
refine
Browse files- app.py +3 -3
- src/about.py +28 -18
app.py
CHANGED
|
@@ -186,7 +186,7 @@ with demo:
|
|
| 186 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="reference-text")
|
| 187 |
|
| 188 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
| 189 |
-
with gr.TabItem("NSFW", elem_id="UnlearnDiffAtk-benchmark-tab-table", id=0):
|
| 190 |
files = ['nudity']
|
| 191 |
with gr.Row():
|
| 192 |
with gr.Column():
|
|
@@ -258,7 +258,7 @@ with demo:
|
|
| 258 |
leaderboard_table,
|
| 259 |
)
|
| 260 |
|
| 261 |
-
with gr.TabItem("Style", elem_id="Style", id=1):
|
| 262 |
files = ['vangogh']
|
| 263 |
with gr.Row():
|
| 264 |
with gr.Column():
|
|
@@ -323,7 +323,7 @@ with demo:
|
|
| 323 |
leaderboard_table,
|
| 324 |
)
|
| 325 |
|
| 326 |
-
with gr.TabItem("Object", elem_id="UnlearnDiffAtk-benchmark-tab-table", id=2):
|
| 327 |
files = ['church','garbage','parachute','tench']
|
| 328 |
with gr.Row():
|
| 329 |
with gr.Column():
|
|
|
|
| 186 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="reference-text")
|
| 187 |
|
| 188 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
| 189 |
+
with gr.TabItem("🔞 NSFW", elem_id="UnlearnDiffAtk-benchmark-tab-table", id=0):
|
| 190 |
files = ['nudity']
|
| 191 |
with gr.Row():
|
| 192 |
with gr.Column():
|
|
|
|
| 258 |
leaderboard_table,
|
| 259 |
)
|
| 260 |
|
| 261 |
+
with gr.TabItem("🎨 Style", elem_id="Style", id=1):
|
| 262 |
files = ['vangogh']
|
| 263 |
with gr.Row():
|
| 264 |
with gr.Column():
|
|
|
|
| 323 |
leaderboard_table,
|
| 324 |
)
|
| 325 |
|
| 326 |
+
with gr.TabItem("🪂 Object", elem_id="UnlearnDiffAtk-benchmark-tab-table", id=2):
|
| 327 |
files = ['church','garbage','parachute','tench']
|
| 328 |
with gr.Row():
|
| 329 |
with gr.Column():
|
src/about.py
CHANGED
|
@@ -28,34 +28,44 @@ SUB_TITLE = """<h2 align="center" id="space-title">Effective and efficient adver
|
|
| 28 |
|
| 29 |
# What does your leaderboard evaluate?
|
| 30 |
INTRODUCTION_TEXT = """
|
| 31 |
-
This benchmark evaluates the robustness of safety-driven unlearned diffusion models (DMs)
|
| 32 |
-
|
| 33 |
-
|
| 34 |
Demo of our offensive method: [UnlearnDiffAtk](https://huggingface.co/spaces/Intel/UnlearnDiffAtk)\\
|
| 35 |
Demo of our defensive method: [AdvUnlearn](https://huggingface.co/spaces/Intel/AdvUnlearn)
|
| 36 |
"""
|
| 37 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 38 |
# Which evaluations are you running? how can people reproduce what you have?
|
| 39 |
LLM_BENCHMARKS_TEXT = f"""
|
| 40 |
For more details of Unlearning Methods used in this benchmarks:\\
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
|
|
|
| 49 |
|
|
|
|
| 50 |
"""
|
| 51 |
|
| 52 |
-
|
| 53 |
-
Evaluation Metrics: \\
|
| 54 |
-
(1) Pre-attack success rate (pre-ASR), lower is better; \\
|
| 55 |
-
(2) Post-attack success rate (post-ASR), lower is better; \\
|
| 56 |
-
(3) Fréchet inception distance(FID) of images generated by Unlearned Methods, lower is better; \\
|
| 57 |
-
(3) CLIP (Contrastive Language-Image Pretraining) Score is to measure contextual alignment with prompt descriptions, higher is better.
|
| 58 |
-
"""
|
| 59 |
|
| 60 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
| 61 |
CITATION_BUTTON_TEXT = r"""
|
|
|
|
| 28 |
|
| 29 |
# What does your leaderboard evaluate?
|
| 30 |
INTRODUCTION_TEXT = """
|
| 31 |
+
This benchmark evaluates the <strong>robustness and utility retaining</strong> of safety-driven unlearned diffusion models (DMs) across a variety of tasks. For more details, please visit the [project](https://www.optml-group.com/posts/mu_attack).\\
|
| 32 |
+
- The robustness of unlearned DM is evaluated through our proposed adversarial prompt attack, [UnlearnDiffAtk](https://github.com/OPTML-Group/Diffusion-MU-Attack), which has been accepted to ECCV 2024.\\
|
| 33 |
+
- The utility retaining of unlearned DM is evaluated through FID and CLIP score on the generated images using [10K randomly sampled COCO caption prompts](https://github.com/OPTML-Group/Diffusion-MU-Attack/blob/main/prompts/coco_10k.csv). \\
|
| 34 |
Demo of our offensive method: [UnlearnDiffAtk](https://huggingface.co/spaces/Intel/UnlearnDiffAtk)\\
|
| 35 |
Demo of our defensive method: [AdvUnlearn](https://huggingface.co/spaces/Intel/AdvUnlearn)
|
| 36 |
"""
|
| 37 |
|
| 38 |
+
EVALUATION_QUEUE_TEXT = """
|
| 39 |
+
<strong>Evaluation Metrics</strong>: \\
|
| 40 |
+
- Pre-Attack Success Rate (<strong>Pre-ASR</strong>): lower is better; \\
|
| 41 |
+
- Post-attack success rate (<strong>Post-ASR</strong>): lower is better; \\
|
| 42 |
+
- Fréchet inception distance(<strong>FID</strong>): evaluate distributional quality of image generations, lower is better; \\
|
| 43 |
+
- <strong>CLIP Score</strong>: measure contextual alignment with prompt descriptions, higher is better. \\
|
| 44 |
+
\\
|
| 45 |
+
|
| 46 |
+
<strong>DM Unlearning Tasks</strong>: \\
|
| 47 |
+
- NSFW: Nudity
|
| 48 |
+
- Style: Van Gogh
|
| 49 |
+
- Objects: Church, Tench, Parachute, Garbage Truck
|
| 50 |
+
"""
|
| 51 |
+
|
| 52 |
# Which evaluations are you running? how can people reproduce what you have?
|
| 53 |
LLM_BENCHMARKS_TEXT = f"""
|
| 54 |
For more details of Unlearning Methods used in this benchmarks:\\
|
| 55 |
+
- [Adversarial Unlearning (AdvUnlearn)](https://github.com/OPTML-Group/AdvUnlearn);\\
|
| 56 |
+
- [Erased Stable Diffusion (ESD)](https://github.com/rohitgandikota/erasing);\\
|
| 57 |
+
- [Forget-Me-Not (FMN)](https://github.com/SHI-Labs/Forget-Me-Not);\\
|
| 58 |
+
- [Ablating Concepts (AC)](https://github.com/nupurkmr9/concept-ablation);\\
|
| 59 |
+
- [Unified Concept Editing (UCE)](https://github.com/rohitgandikota/unified-concept-editing);\\
|
| 60 |
+
- [concept-SemiPermeable Membrane (SPM)](https://github.com/Con6924/SPM); \\
|
| 61 |
+
- [Saliency Unlearning (SalUn)](https://github.com/OPTML-Group/Unlearn-Saliency); \\
|
| 62 |
+
- [EraseDiff (ED)](https://github.com/JingWu321/EraseDiff); \\
|
| 63 |
+
- [ScissorHands (SH)](https://github.com/JingWu321/Scissorhands).
|
| 64 |
|
| 65 |
+
We will evaluate your model on UnlearnDiffAtk Benchmark! Open a [github issue](https://github.com/OPTML-Group/Diffusion-MU-Attack/issues) or email us at zhan1853@msu.edu!
|
| 66 |
"""
|
| 67 |
|
| 68 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 69 |
|
| 70 |
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
|
| 71 |
CITATION_BUTTON_TEXT = r"""
|