Spaces:
Running
Running
Update index.html
Browse files- index.html +168 -8
index.html
CHANGED
|
@@ -1,9 +1,169 @@
|
|
| 1 |
-
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7 |
</div>
|
| 8 |
-
</
|
| 9 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
<!DOCTYPE html>
|
| 2 |
+
<html lang="en">
|
| 3 |
+
<head>
|
| 4 |
+
<meta charset="utf-8">
|
| 5 |
+
<meta name="viewport" content="width=device-width, initial-scale=1">
|
| 6 |
+
<title>Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion</title>
|
| 7 |
+
<link rel="shortcut icon" href="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/favicon.ico">
|
| 8 |
+
<meta property="og:image" content="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/teaser.png"/>
|
| 9 |
+
<meta property="og:title" content="Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion" />
|
| 10 |
+
<meta property="og:description" content="Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion" />
|
| 11 |
+
<!-- Tailwind CSS -->
|
| 12 |
+
<script src="https://cdn.tailwindcss.com"></script>
|
| 13 |
+
<!-- Google Fonts: Poppins -->
|
| 14 |
+
<link href="https://fonts.googleapis.com/css2?family=Poppins:wght@400;600;700&display=swap" rel="stylesheet">
|
| 15 |
+
<!-- Font Awesome -->
|
| 16 |
+
<script src="https://kit.fontawesome.com/ad96f96272.js" crossorigin="anonymous"></script>
|
| 17 |
+
<!-- Academicons -->
|
| 18 |
+
<link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
|
| 19 |
+
<style>
|
| 20 |
+
body {
|
| 21 |
+
font-family: 'Poppins', sans-serif;
|
| 22 |
+
background: linear-gradient(135deg, #1e293b 0%, #0f172a 100%);
|
| 23 |
+
color: #f1f5f9;
|
| 24 |
+
min-height: 100vh;
|
| 25 |
+
}
|
| 26 |
+
::selection {
|
| 27 |
+
background: #2563eb;
|
| 28 |
+
color: #fff;
|
| 29 |
+
}
|
| 30 |
+
</style>
|
| 31 |
+
</head>
|
| 32 |
+
<body class="bg-gradient-to-br from-slate-900 to-slate-800 min-h-screen">
|
| 33 |
+
<!-- Navigation Bar -->
|
| 34 |
+
<nav class="bg-gradient-to-r from-blue-600 to-blue-800 shadow-lg sticky top-0 z-50">
|
| 35 |
+
<div class="max-w-7xl mx-auto px-4 sm:px-6 lg:px-8">
|
| 36 |
+
<div class="flex items-center justify-between h-16">
|
| 37 |
+
<a href="#" class="text-xl md:text-2xl font-bold text-white">Zero-Shot Audio Editing</a>
|
| 38 |
+
<div class="hidden md:flex space-x-6">
|
| 39 |
+
<a href="#supsamples" class="text-gray-200 hover:text-blue-300 transition">Text-based Editing</a>
|
| 40 |
+
<a href="#unsupsamples" class="text-gray-200 hover:text-blue-300 transition">Unsup. Editing</a>
|
| 41 |
+
<a href="#supcomparisons" class="text-gray-200 hover:text-blue-300 transition">Text-Based Editing Comp.</a>
|
| 42 |
+
<a href="#unsupcomparisons" class="text-gray-200 hover:text-blue-300 transition">Unsup. Editing Comp.</a>
|
| 43 |
+
</div>
|
| 44 |
+
<button id="mobile-menu-btn" class="md:hidden text-gray-200 text-2xl focus:outline-none">
|
| 45 |
+
<i class="fas fa-bars"></i>
|
| 46 |
+
</button>
|
| 47 |
+
</div>
|
| 48 |
+
<!-- Mobile Menu -->
|
| 49 |
+
<div id="mobile-menu" class="md:hidden hidden flex-col space-y-2 pb-4">
|
| 50 |
+
<a href="#supsamples" class="block text-gray-200 hover:text-blue-300">Text-based Editing</a>
|
| 51 |
+
<a href="#unsupsamples" class="block text-gray-200 hover:text-blue-300">Unsup. Editing</a>
|
| 52 |
+
<a href="#supcomparisons" class="block text-gray-200 hover:text-blue-300">Text-Based Editing Comp.</a>
|
| 53 |
+
<a href="#unsupcomparisons" class="block text-gray-200 hover:text-blue-300">Unsup. Editing Comp.</a>
|
| 54 |
+
</div>
|
| 55 |
</div>
|
| 56 |
+
</nav>
|
| 57 |
+
<main class="max-w-4xl mx-auto px-4 sm:px-6 lg:px-8">
|
| 58 |
+
<!-- Back to Top Button -->
|
| 59 |
+
<button onclick="window.scrollTo({top: 0, behavior: 'smooth'});" class="fixed bottom-8 right-8 bg-red-600 text-white rounded-full p-4 shadow-lg hover:bg-red-700 transition hidden md:block z-50" aria-label="Back to top" id="btn-back-to-top">
|
| 60 |
+
<i class="fas fa-arrow-up"></i>
|
| 61 |
+
</button>
|
| 62 |
+
<!-- Header Section -->
|
| 63 |
+
<section class="text-center py-10">
|
| 64 |
+
<h1 class="text-2xl sm:text-3xl md:text-4xl lg:text-5xl font-bold mb-4">Zero-Shot Unsupervised and Text-Based Audio Editing Using DDPM Inversion</h1>
|
| 65 |
+
<h4 class="text-lg sm:text-xl md:text-2xl mb-2">ICML 2024</h4>
|
| 66 |
+
<div class="flex flex-wrap justify-center gap-4 mt-4 text-base sm:text-lg">
|
| 67 |
+
<a href="https://www.linkedin.com/in/hilamanor/" target="_blank" class="hover:text-blue-400 transition">Hila Manor</a>
|
| 68 |
+
<span class="text-gray-400 hidden sm:inline">|</span>
|
| 69 |
+
<a href="https://tomer.net.technion.ac.il/" target="_blank" class="hover:text-blue-400 transition">Tomer Michaeli</a>
|
| 70 |
+
</div>
|
| 71 |
+
<p class="text-center text-base sm:text-lg mt-2">Technion - Israel Institute of Technology</p>
|
| 72 |
+
<div class="flex flex-wrap justify-center gap-3 mt-6">
|
| 73 |
+
<a class="px-4 py-2 rounded-lg border border-blue-400 text-blue-400 hover:bg-blue-500 hover:text-white transition flex items-center gap-2" href="https://arxiv.org/abs/2402.10009" target="_blank">
|
| 74 |
+
<i class="ai ai-arxiv"></i>ArXiv
|
| 75 |
+
</a>
|
| 76 |
+
<a class="px-4 py-2 rounded-lg border border-blue-400 text-blue-400 hover:bg-blue-500 hover:text-white transition flex items-center gap-2" href="https://github.com/HilaManor/AudioEditingCode/" target="_blank">
|
| 77 |
+
<i class="fab fa-github"></i>Code
|
| 78 |
+
</a>
|
| 79 |
+
<a class="px-4 py-2 rounded-lg border border-blue-400 text-blue-400 hover:bg-blue-500 hover:text-white transition flex items-center gap-2" href="https://youtu.be/lBnldOQVbS4" target="_blank">
|
| 80 |
+
<i class="fab fa-youtube"></i>Presentation
|
| 81 |
+
</a>
|
| 82 |
+
<a class="px-4 py-2 rounded-lg border border-blue-400 text-blue-400 hover:bg-blue-500 hover:text-white transition flex items-center gap-2" href="https://huggingface.co/spaces/hilamanor/audioEditing/" target="_blank">
|
| 83 |
+
🤗 Text-Based Space
|
| 84 |
+
</a>
|
| 85 |
+
</div>
|
| 86 |
+
</section>
|
| 87 |
+
<!-- Abstract and Teaser -->
|
| 88 |
+
<section class="text-center py-8">
|
| 89 |
+
<img alt="Teaser" src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/teaser.png" class="w-full max-w-lg mx-auto rounded-lg shadow-lg mb-6"/>
|
| 90 |
+
<h2 class="text-xl sm:text-2xl md:text-3xl font-semibold mb-2">Abstract</h2>
|
| 91 |
+
<p class="text-base sm:text-lg leading-relaxed mt-4 text-gray-200">
|
| 92 |
+
Editing signals using large pre-trained models, in a zero-shot manner, has recently seen rapid advancements in the image domain. However, this wave has yet to reach the audio domain.
|
| 93 |
+
In this paper, we explore two zero-shot editing techniques for audio signals, which use DDPM inversion on pre-trained diffusion models. The first, adopted from the image domain, allows text-based editing.
|
| 94 |
+
The second, is a novel approach for discovering semantically meaningful editing directions without supervision.
|
| 95 |
+
When applied to music signals, this method exposes a range of musically interesting modifications, from controlling the participation of specific instruments to improvisations on the melody.
|
| 96 |
+
</p>
|
| 97 |
+
</section>
|
| 98 |
+
<hr class="border-gray-700 my-8">
|
| 99 |
+
<!-- Video Overview -->
|
| 100 |
+
<section class="text-center py-8">
|
| 101 |
+
<h2 class="text-xl sm:text-2xl md:text-3xl font-semibold mb-2">Video Overview</h2>
|
| 102 |
+
<p class="text-base sm:text-lg mt-2 text-gray-300">For people in a hurry. Images generated by <a href="https://openai.com/dall-e-2" class="text-blue-400 hover:underline">DALL-E 2</a> and <a href="https://www.bing.com/copilot" class="text-blue-400 hover:underline">Copilot</a>.</p>
|
| 103 |
+
<video controls class="w-full max-w-md mx-auto rounded-lg shadow-lg mt-4">
|
| 104 |
+
<source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/overview.mp4" type="video/mp4">
|
| 105 |
+
Your browser does not support the video tag.
|
| 106 |
+
</video>
|
| 107 |
+
</section>
|
| 108 |
+
<hr class="border-gray-700 my-8">
|
| 109 |
+
<!-- Samples of Editing -->
|
| 110 |
+
<section class="text-center py-8">
|
| 111 |
+
<h2 class="text-xl sm:text-2xl md:text-3xl font-semibold mb-2">1. Samples of Editing</h2>
|
| 112 |
+
<p class="text-base sm:text-lg mt-2 text-gray-300">We present samples of audio editing using our proposed methods. The samples are organized into two sections: text-based editing and unsupervised editing.</p>
|
| 113 |
+
<!-- Text-Based Editing Table -->
|
| 114 |
+
<h3 id="supsamples" class="text-lg sm:text-xl md:text-2xl font-semibold mt-6 mb-4">1.1. Samples of Text-Based Editing</h3>
|
| 115 |
+
<div class="overflow-x-auto">
|
| 116 |
+
<table class="min-w-full text-sm text-left text-gray-200 border border-gray-700 rounded-lg">
|
| 117 |
+
<thead class="bg-blue-900/80">
|
| 118 |
+
<tr>
|
| 119 |
+
<th class="px-2 py-2">#</th>
|
| 120 |
+
<th class="px-2 py-2">Source Prompt</th>
|
| 121 |
+
<th class="px-2 py-2">Target Prompt</th>
|
| 122 |
+
<th class="px-2 py-2">Original Audio</th>
|
| 123 |
+
<th class="px-2 py-2">Edited Audio</th>
|
| 124 |
+
<th class="px-2 py-2">Edit T<sub>start</sub></th>
|
| 125 |
+
</tr>
|
| 126 |
+
</thead>
|
| 127 |
+
<tbody>
|
| 128 |
+
<tr class="hover:bg-blue-800/30 transition">
|
| 129 |
+
<td class="px-2 py-2">1</td>
|
| 130 |
+
<td class="px-2 py-2">A recording of a <b>sneaky jazz</b> song.</td>
|
| 131 |
+
<td class="px-2 py-2">A recording of a <b>tense classical</b> music score.</td>
|
| 132 |
+
<td class="px-2 py-2"><audio controls class="w-32 sm:w-40 md:w-52"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/orig/MDDBFreeJazz.mp3" type="audio/mp4"></audio></td>
|
| 133 |
+
<td class="px-2 py-2"><audio controls class="w-32 sm:w-40 md:w-52"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/sup_samples/orchestra_MDDBFreeJazz_ours_90.mp3" type="audio/mp4"></audio></td>
|
| 134 |
+
<td class="px-2 py-2 text-center">110</td>
|
| 135 |
+
</tr>
|
| 136 |
+
<tr class="hover:bg-blue-800/30 transition">
|
| 137 |
+
<td class="px-2 py-2">2</td>
|
| 138 |
+
<td class="px-2 py-2">A recording of a <b>hard rock</b> song.</td>
|
| 139 |
+
<td class="px-2 py-2">A recording of a <b>jazz</b> song.</td>
|
| 140 |
+
<td class="px-2 py-2"><audio controls class="w-32 sm:w-40 md:w-52"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/orig/MDDBZeppelin.mp3" type="audio/mp4"></audio></td>
|
| 141 |
+
<td class="px-2 py-2"><audio controls class="w-32 sm:w-40 md:w-52"><source src="https://github.com/HilaManor/AudioEditingCode/raw/refs/heads/codeclean/docs/resources/audio/sup_samples/jazz_MDDBZeppelin_ours_100.mp3" type="audio/mp4"></audio></td>
|
| 142 |
+
<td class="px-2 py-2 text-center">100</td>
|
| 143 |
+
</tr>
|
| 144 |
+
<!-- Add more rows as needed -->
|
| 145 |
+
</tbody>
|
| 146 |
+
</table>
|
| 147 |
+
</div>
|
| 148 |
+
</section>
|
| 149 |
+
</main>
|
| 150 |
+
<script>
|
| 151 |
+
// Mobile menu toggle
|
| 152 |
+
const menuBtn = document.getElementById('mobile-menu-btn');
|
| 153 |
+
const menu = document.getElementById('mobile-menu');
|
| 154 |
+
menuBtn.addEventListener('click', () => {
|
| 155 |
+
menu.classList.toggle('hidden');
|
| 156 |
+
});
|
| 157 |
+
|
| 158 |
+
// Show back-to-top button on scroll
|
| 159 |
+
window.addEventListener('scroll', function() {
|
| 160 |
+
const btn = document.getElementById('btn-back-to-top');
|
| 161 |
+
if (window.scrollY > 300) {
|
| 162 |
+
btn.classList.remove('hidden');
|
| 163 |
+
} else {
|
| 164 |
+
btn.classList.add('hidden');
|
| 165 |
+
}
|
| 166 |
+
});
|
| 167 |
+
</script>
|
| 168 |
+
</body>
|
| 169 |
+
</html>
|