Spaces:
Running
on
Zero
Running
on
Zero
Nithya
committed on
Commit
·
d607f42
1
Parent(s):
8505dc9
added examples
Browse files- .gitattributes +1 -0
- app.py +34 -2
- examples/ex1-hf.wav +3 -0
- examples/ex2-hf.wav +3 -0
- examples/ex3-hf.wav +3 -0
- examples/ex4-hf.wav +3 -0
- examples/ex5-hf.wav +3 -0
.gitattributes
CHANGED
|
@@ -4,3 +4,4 @@ models/diffusion_pitch/last.ckpt filter=lfs diff=lfs merge=lfs -text
|
|
| 4 |
models/pitch_to_audio/last.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 5 |
models/diffusion_pitch/qt.joblib filter=lfs diff=lfs merge=lfs -text
|
| 6 |
models/pitch_to_audio/qt.joblib filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 4 |
models/pitch_to_audio/last.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 5 |
models/diffusion_pitch/qt.joblib filter=lfs diff=lfs merge=lfs -text
|
| 6 |
models/pitch_to_audio/qt.joblib filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
examples/** filter=lfs diff=lfs merge=lfs -text
|
app.py
CHANGED
|
@@ -195,14 +195,46 @@ def set_guide_and_generate(audio):
|
|
| 195 |
return audio, user_input_plot, pitch
|
| 196 |
|
| 197 |
with gr.Blocks() as demo:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 198 |
with gr.Row():
|
| 199 |
with gr.Column():
|
| 200 |
audio = gr.Audio(label="Input")
|
| 201 |
sbmt = gr.Button()
|
| 202 |
-
|
|
|
|
| 203 |
with gr.Column():
|
| 204 |
generated_audio = gr.Audio(label="Generated Audio")
|
| 205 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 206 |
sbmt.click(set_guide_and_generate, inputs=[audio], outputs=[generated_audio, user_input, generated_pitch])
|
| 207 |
|
| 208 |
def main(argv):
|
|
|
|
| 195 |
return audio, user_input_plot, pitch
|
| 196 |
|
| 197 |
with gr.Blocks() as demo:
|
| 198 |
+
with gr.Column():
|
| 199 |
+
gr.Markdown("""
|
| 200 |
+
# GaMaDHaNi: HIERARCHICAL GENERATIVE MODELING OF MELODIC VOCAL CONTOURS IN HINDUSTANI CLASSICAL MUSIC
|
| 201 |
+
:book: Read more about the project [here](https://arxiv.org/pdf/2408.12658) <br>
|
| 202 |
+
:samples: Listen to the samples [here](https://snnithya.github.io/gamadhani-samples) <br>
|
| 203 |
+
""")
|
| 204 |
+
gr.Markdown("""
|
| 205 |
+
## Instructions
|
| 206 |
+
In this demo you can interact with the model in two ways:
|
| 207 |
+
1. **Call and response**: The model will try to continue the idea that you input. This is similar to the 'primed generation' discussed in the paper.
|
| 208 |
+
2. **Melodic reinterpretation**: Akin to the idea of 'coarse pitch conditioning' presented in the paper, you can input a pitch contour and the model will generate audio that is similar to, but not exactly the same as, your input. <br><br>
|
| 209 |
+
**Upload an audio file or record your voice to get started!**
|
| 210 |
+
""")
|
| 211 |
+
gr.Markdown("""
|
| 212 |
+
This is still a work in progress, so please feel free to share any weird or interesting examples; we would love to hear them! Contact us at [snnithya@mit.edu](mailto:snnithya@mit.edu).
|
| 213 |
+
""")
|
| 214 |
+
|
| 215 |
with gr.Row():
|
| 216 |
with gr.Column():
|
| 217 |
audio = gr.Audio(label="Input")
|
| 218 |
sbmt = gr.Button()
|
| 219 |
+
with gr.Accordion("View Pitch Plot"):
|
| 220 |
+
user_input = gr.Plot(label="User Input")
|
| 221 |
with gr.Column():
|
| 222 |
generated_audio = gr.Audio(label="Generated Audio")
|
| 223 |
+
with gr.Accordion("View Pitch Plot"):
|
| 224 |
+
generated_pitch = gr.Plot(label="Generated Pitch")
|
| 225 |
+
example_description = gr.Textbox(label="Example Description", interactive=False)
|
| 226 |
+
examples = gr.Examples(
|
| 227 |
+
examples=[
|
| 228 |
+
["examples/ex1-hf.wav"],
|
| 229 |
+
["examples/ex2-hf.wav"],
|
| 230 |
+
["examples/ex3-hf.wav"],
|
| 231 |
+
["examples/ex4-hf.wav"],
|
| 232 |
+
["examples/ex5-hf.wav"]
|
| 233 |
+
# Add more examples as needed
|
| 234 |
+
],
|
| 235 |
+
inputs=audio
|
| 236 |
+
)
|
| 237 |
+
|
| 238 |
sbmt.click(set_guide_and_generate, inputs=[audio], outputs=[generated_audio, user_input, generated_pitch])
|
| 239 |
|
| 240 |
def main(argv):
|
examples/ex1-hf.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30ae54c7e54036729d69fe70bfb294d1b80e445ad917df40bb293dfd88e7b21a
|
| 3 |
+
size 307406
|
examples/ex2-hf.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9705358da218e84a8879b31ff30ee4a692706b6a5b6f76a9fdb21075300e3e43
|
| 3 |
+
size 265080
|
examples/ex3-hf.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e816747fc71742ac1a4897ff7eebc3a7214c5d23a3c1b291f6d96e0630b82a9d
|
| 3 |
+
size 159868
|
examples/ex4-hf.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0178c8ca78f6ae4bcd312f3f5c005dabfd1cb1f1520802872a4cd0507fa5878d
|
| 3 |
+
size 291182
|
examples/ex5-hf.wav
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e65935858bd0f9a8665d90929d69b8f2fcd6a5f52f079f41542c57426c8b4ace
|
| 3 |
+
size 128950
|