Spaces:

chenxie95
/

MeanAudio

Running on Zero

App Files Community

AndreasXi committed 20 days ago

Commit

bbd22e4

1 Parent(s): 079604c

add rlhf

Browse files

Files changed (1) hide show

app.py +22 -1

app.py CHANGED Viewed

@@ -147,7 +147,7 @@ def generate_audio_gradio(
     rng = torch.Generator(device=device)
     # force to 42
-    # rng.manual_seed(42)
     audios = generation_func(
         [prompt]*NUM_SAMPLE,
@@ -191,6 +191,27 @@ duration = gr.Slider(minimum=1, maximum=30, value=10, step=1, label="Duration",
 # seed = gr.Slider(minimum=1, maximum=1000000, value=42, step=1, label="Seed", interactive=True)
 variant = gr.Dropdown(label="Model Variant", choices=list(all_model_cfg.keys()), value='meanaudio_s_full', interactive=True)
 gr_interface = gr.Interface(
     fn=generate_audio_gradio,
     inputs=[input_text, duration, cfg_strength, denoising_steps, variant],

     rng = torch.Generator(device=device)
     # force to 42
+    rng.manual_seed(42)
     audios = generation_func(
         [prompt]*NUM_SAMPLE,
 # seed = gr.Slider(minimum=1, maximum=1000000, value=42, step=1, label="Seed", interactive=True)
 variant = gr.Dropdown(label="Model Variant", choices=list(all_model_cfg.keys()), value='meanaudio_s_full', interactive=True)
+description_text = """
+**MeanAudio** is a novel text-to-audio generator that uses **MeanFlow** to synthesize realistic and faithful audio in few sampling steps. It achieves state-of-the-art performance in single-step audio generation and delivers strong performance in multi-step audio generation.
+<div style="display: flex; gap: 10px; align-items: center;">
+    <a href="https://huggingface.co/AndreasXi/MeanAudio">
+    <img src="https://img.shields.io/badge/Model-HuggingFace-violet?logo=huggingface" alt="Hugging Face Model">
+    </a>
+    <a href="https://huggingface.co/spaces/chenxie95/MeanAudio">
+    <img src="https://img.shields.io/badge/Space-HuggingFace-8A2BE2?logo=huggingface" alt="Hugging Face Space">
+    </a>
+    <a href="https://meanaudio.github.io/">
+    <img src="https://img.shields.io/badge/Project-Page-brightred?style=flat" alt="Project Page">
+    </a>
+    <a href="https://github.com/xiquan-li/MeanAudio">
+    <img src="https://img.shields.io/badge/Code-GitHub-black?logo=github" alt="GitHub">
+    </a>
+</div>
+"""
 gr_interface = gr.Interface(
     fn=generate_audio_gradio,
     inputs=[input_text, duration, cfg_strength, denoising_steps, variant],