Spaces:
Running
Running
Update index.html
Browse files- index.html +9 -168
index.html
CHANGED
|
@@ -1,168 +1,9 @@
|
|
| 1 |
-
|
| 2 |
-
<
|
| 3 |
-
<
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
<meta property="og:description" content="Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion" />
|
| 11 |
-
|
| 12 |
-
<!-- Tailwind CSS -->
|
| 13 |
-
<script src="https://cdn.tailwindcss.com"></script>
|
| 14 |
-
<!-- Google Fonts: Poppins -->
|
| 15 |
-
<link href="https://fonts.googleapis.com/css2?family=Poppins:wght@400;600;700&display=swap" rel="stylesheet">
|
| 16 |
-
<!-- Font Awesome -->
|
| 17 |
-
<script src="https://kit.fontawesome.com/ad96f96272.js" crossorigin="anonymous"></script>
|
| 18 |
-
<!-- Academicons -->
|
| 19 |
-
<link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
|
| 20 |
-
|
| 21 |
-
<style>
|
| 22 |
-
body {
|
| 23 |
-
font-family: 'Poppins', sans-serif;
|
| 24 |
-
background: linear-gradient(135deg, #1e293b 0%, #0f172a 100%);
|
| 25 |
-
color: #f1f5f9;
|
| 26 |
-
min-height: 100vh;
|
| 27 |
-
}
|
| 28 |
-
.glass {
|
| 29 |
-
background: rgba(30, 41, 59, 0.7);
|
| 30 |
-
box-shadow: 0 8px 32px 0 rgba(31, 38, 135, 0.37);
|
| 31 |
-
backdrop-filter: blur(8px);
|
| 32 |
-
border-radius: 1rem;
|
| 33 |
-
border: 1px solid rgba(255,255,255,0.08);
|
| 34 |
-
}
|
| 35 |
-
.gradient-btn {
|
| 36 |
-
background: linear-gradient(90deg, #2563eb 0%, #1e40af 100%);
|
| 37 |
-
color: #fff;
|
| 38 |
-
transition: transform 0.2s, box-shadow 0.2s;
|
| 39 |
-
}
|
| 40 |
-
.gradient-btn:hover {
|
| 41 |
-
transform: translateY(-2px) scale(1.03);
|
| 42 |
-
box-shadow: 0 4px 20px 0 rgba(37,99,235,0.25);
|
| 43 |
-
background: linear-gradient(90deg, #1e40af 0%, #2563eb 100%);
|
| 44 |
-
}
|
| 45 |
-
.audio-player {
|
| 46 |
-
width: 100%;
|
| 47 |
-
max-width: 260px;
|
| 48 |
-
background: #1e293b;
|
| 49 |
-
border-radius: 0.5rem;
|
| 50 |
-
box-shadow: 0 2px 8px rgba(16, 24, 39, 0.2);
|
| 51 |
-
padding: 0.5rem;
|
| 52 |
-
}
|
| 53 |
-
::selection {
|
| 54 |
-
background: #2563eb;
|
| 55 |
-
color: #fff;
|
| 56 |
-
}
|
| 57 |
-
</style>
|
| 58 |
-
</head>
|
| 59 |
-
<body>
|
| 60 |
-
<!-- Navigation Bar -->
|
| 61 |
-
<nav class="glass sticky top-0 z-50 flex items-center justify-between px-6 py-4 shadow-lg">
|
| 62 |
-
<a href="#" class="text-2xl font-bold tracking-tight bg-gradient-to-r from-blue-400 to-indigo-500 bg-clip-text text-transparent">Zero-Shot Audio Editing</a>
|
| 63 |
-
<div class="hidden md:flex space-x-6">
|
| 64 |
-
<a href="#supsamples" class="hover:text-blue-400 transition">Text-based Editing</a>
|
| 65 |
-
<a href="#unsupsamples" class="hover:text-blue-400 transition">Unsup. Editing</a>
|
| 66 |
-
<a href="#supcomparisons" class="hover:text-blue-400 transition">Text-Based Editing Comp.</a>
|
| 67 |
-
<a href="#unsupcomparisons" class="hover:text-blue-400 transition">Unsup. Editing Comp.</a>
|
| 68 |
-
</div>
|
| 69 |
-
<button class="md:hidden text-2xl"><i class="fas fa-bars"></i></button>
|
| 70 |
-
</nav>
|
| 71 |
-
|
| 72 |
-
<!-- Header Section -->
|
| 73 |
-
<header class="max-w-3xl mx-auto mt-12 text-center glass py-10 px-6">
|
| 74 |
-
<h1 class="text-4xl md:text-5xl font-extrabold mb-4 bg-gradient-to-r from-blue-400 to-indigo-500 bg-clip-text text-transparent">
|
| 75 |
-
Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion
|
| 76 |
-
</h1>
|
| 77 |
-
<h4 class="text-xl md:text-2xl font-semibold mb-2">ICML 2024</h4>
|
| 78 |
-
<div class="flex flex-wrap justify-center gap-4 mb-2">
|
| 79 |
-
<a href="https://www.linkedin.com/in/hilamanor/" target="_blank" class="text-lg hover:text-blue-400 transition">Hila Manor</a>
|
| 80 |
-
<span class="text-gray-400">|</span>
|
| 81 |
-
<a href="https://tomer.net.technion.ac.il/" target="_blank" class="text-lg hover:text-blue-400 transition">Tomer Michaeli</a>
|
| 82 |
-
</div>
|
| 83 |
-
<p class="mb-4 text-gray-300">Technion - Israel Institute of Technology</p>
|
| 84 |
-
<div class="flex flex-wrap justify-center gap-4 mt-4">
|
| 85 |
-
<a class="gradient-btn px-5 py-2 rounded-lg font-semibold flex items-center gap-2" href="https://arxiv.org/abs/2402.10009" target="_blank"><i class="ai ai-arxiv"></i>ArXiv</a>
|
| 86 |
-
<a class="gradient-btn px-5 py-2 rounded-lg font-semibold flex items-center gap-2" href="https://github.com/HilaManor/AudioEditingCode/" target="_blank"><i class="fab fa-github"></i>Code</a>
|
| 87 |
-
<a class="gradient-btn px-5 py-2 rounded-lg font-semibold flex items-center gap-2" href="https://youtu.be/lBnldOQVbS4" target="_blank"><i class="fab fa-youtube"></i>Presentation</a>
|
| 88 |
-
<a class="gradient-btn px-5 py-2 rounded-lg font-semibold flex items-center gap-2" href="https://huggingface.co/spaces/hilamanor/audioEditing/" target="_blank">🤗 Text-Based Space</a>
|
| 89 |
-
</div>
|
| 90 |
-
</header>
|
| 91 |
-
|
| 92 |
-
<!-- Abstract and Teaser -->
|
| 93 |
-
<section class="max-w-3xl mx-auto my-12 glass py-8 px-6 text-center">
|
| 94 |
-
<img alt="Teaser" src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/teaser.png" class="mx-auto rounded-xl shadow-xl mb-6 w-full md:w-3/4"/>
|
| 95 |
-
<h2 class="text-2xl font-semibold mb-4">Abstract</h2>
|
| 96 |
-
<p class="text-lg leading-relaxed text-gray-200">
|
| 97 |
-
Editing signals using large pre-trained models, in a zero-shot manner, has recently seen rapid advancements in the image domain. However, this wave has yet to reach the audio domain.
|
| 98 |
-
In this paper, we explore two zero-shot editing techniques for audio signals, which use DDPM inversion on pre-trained diffusion models. The first, adopted from the image domain, allows text-based editing.
|
| 99 |
-
The second, is a novel approach for discovering semantically meaningful editing directions without supervision.
|
| 100 |
-
When applied to music signals, this method exposes a range of musically interesting modifications, from controlling the participation of specific instruments to improvisations on the melody.
|
| 101 |
-
</p>
|
| 102 |
-
</section>
|
| 103 |
-
|
| 104 |
-
<!-- Video Overview -->
|
| 105 |
-
<section class="max-w-3xl mx-auto my-12 glass py-8 px-6 text-center">
|
| 106 |
-
<h2 class="text-2xl font-semibold mb-2">Video Overview</h2>
|
| 107 |
-
<p class="text-gray-300 mb-4">For people in a hurry. Images generated by <a href="https://openai.com/dall-e-2" class="text-blue-400 hover:underline">DALL-E 2</a> and <a href="https://www.bing.com/copilot" class="text-blue-400 hover:underline">Copilot</a>.</p>
|
| 108 |
-
<video controls class="mx-auto rounded-xl shadow-xl w-full max-w-md">
|
| 109 |
-
<source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/overview.mp4" type="video/mp4">
|
| 110 |
-
Your browser does not support the video tag.
|
| 111 |
-
</video>
|
| 112 |
-
</section>
|
| 113 |
-
|
| 114 |
-
<!-- Samples of Editing -->
|
| 115 |
-
<section class="max-w-5xl mx-auto my-12 glass py-8 px-6">
|
| 116 |
-
<h2 class="text-2xl font-semibold text-center mb-4">1. Samples of Editing</h2>
|
| 117 |
-
<p class="text-center text-gray-300 mb-8">We present samples of audio editing using our proposed methods. The samples are organized into two sections: text-based editing and unsupervised editing.</p>
|
| 118 |
-
|
| 119 |
-
<!-- Text-Based Editing Table -->
|
| 120 |
-
<div>
|
| 121 |
-
<h3 id="supsamples" class="text-xl font-semibold mb-4">1.1. Samples of Text-Based Editing</h3>
|
| 122 |
-
<div class="overflow-x-auto">
|
| 123 |
-
<table class="min-w-full text-sm text-left text-gray-200">
|
| 124 |
-
<thead class="bg-blue-900/80">
|
| 125 |
-
<tr>
|
| 126 |
-
<th class="px-4 py-2">#</th>
|
| 127 |
-
<th class="px-4 py-2">Source Prompt</th>
|
| 128 |
-
<th class="px-4 py-2">Target Prompt</th>
|
| 129 |
-
<th class="px-4 py-2">Original Audio</th>
|
| 130 |
-
<th class="px-4 py-2">Edited Audio</th>
|
| 131 |
-
<th class="px-4 py-2">Edit T<sub>start</sub></th>
|
| 132 |
-
</tr>
|
| 133 |
-
</thead>
|
| 134 |
-
<tbody>
|
| 135 |
-
<tr class="hover:bg-blue-800/30 transition">
|
| 136 |
-
<td class="px-4 py-2">1</td>
|
| 137 |
-
<td class="px-4 py-2">A recording of a <b>sneaky jazz</b> song.</td>
|
| 138 |
-
<td class="px-4 py-2">A recording of a <b>tense classical</b> music score.</td>
|
| 139 |
-
<td class="px-4 py-2"><audio controls class="audio-player"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/orig/MDDBFreeJazz.mp3" type="audio/mp4"></audio></td>
|
| 140 |
-
<td class="px-4 py-2"><audio controls class="audio-player"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/sup_samples/orchestra_MDDBFreeJazz_ours_90.mp3" type="audio/mp4"></audio></td>
|
| 141 |
-
<td class="px-4 py-2 text-center">110</td>
|
| 142 |
-
</tr>
|
| 143 |
-
<!-- Repeat for other rows as needed ... -->
|
| 144 |
-
</tbody>
|
| 145 |
-
</table>
|
| 146 |
-
</div>
|
| 147 |
-
</div>
|
| 148 |
-
<!-- Add more sections as needed -->
|
| 149 |
-
</section>
|
| 150 |
-
|
| 151 |
-
<!-- Back to Top Button -->
|
| 152 |
-
<button onclick="window.scrollTo({top: 0, behavior: 'smooth'});" class="fixed bottom-8 right-8 gradient-btn rounded-full p-4 shadow-xl hover:scale-110 transition hidden md:block" aria-label="Back to top">
|
| 153 |
-
<i class="fas fa-arrow-up"></i>
|
| 154 |
-
</button>
|
| 155 |
-
|
| 156 |
-
<script>
|
| 157 |
-
// Show back-to-top button on scroll
|
| 158 |
-
window.addEventListener('scroll', function() {
|
| 159 |
-
const btn = document.querySelector('.fixed.bottom-8.right-8');
|
| 160 |
-
if (window.scrollY > 300) {
|
| 161 |
-
btn.classList.remove('hidden');
|
| 162 |
-
} else {
|
| 163 |
-
btn.classList.add('hidden');
|
| 164 |
-
}
|
| 165 |
-
});
|
| 166 |
-
</script>
|
| 167 |
-
</body>
|
| 168 |
-
</html>
|
|
|
|
| 1 |
+
<div class="container-xl px-2 sm:px-4 lg:px-8">
|
| 2 |
+
<div class="text-center py-6 md:py-12">
|
| 3 |
+
<h1 class="text-2xl md:text-4xl font-bold mb-2">Zero-Shot Audio Editing</h1>
|
| 4 |
+
<div class="flex flex-col md:flex-row justify-center gap-3 md:gap-6 mt-4">
|
| 5 |
+
<a href="#" class="w-full md:w-auto btn btn-outline-primary text-base md:text-lg py-2">ArXiv</a>
|
| 6 |
+
<a href="#" class="w-full md:w-auto btn btn-outline-primary text-base md:text-lg py-2">Code</a>
|
| 7 |
+
</div>
|
| 8 |
+
</div>
|
| 9 |
+
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|