Spaces:

Nymbo
/

Tools

Running

App Files Community

Nymbo committed 12 days ago

Commit

948d89f

verified ·

1 Parent(s): 0c8e311

Adds all Kokoro voices to the MCP context, plus links to browse all available image gen and video gen models

Browse files

Files changed (1) hide show

app.py +17 -7

app.py CHANGED Viewed

@@ -1773,9 +1773,9 @@ kokoro_interface = gr.Interface(
     ),
     api_description=(
         "Synthesize speech from text using Kokoro-82M TTS model. Returns (sample_rate, waveform) suitable for playback. "
-        "Supports unlimited text length by processing all segments. Voice examples: 'af_heart' (US female), 'am_onyx' (US male), "
-        "'bf_emma' (British female), 'af_sky' (US female), 'af_nicole' (US female), "
-        "Parameters: text (str), speed (float 0.5–2.0, default 1.25x), voice (str from 54 available options, default 'af_heart'). "
         "Return the generated media to the user in this format `![Alt text](URL)`"
     ),
     flagging_mode="never",
@@ -1984,7 +1984,12 @@ image_generation_interface = gr.Interface(
     fn=Generate_Image,
     inputs=[
         gr.Textbox(label="Prompt", placeholder="Enter a prompt", lines=2),
-        gr.Textbox(label="Model", value="black-forest-labs/FLUX.1-Krea-dev", placeholder="creator/model-name"),
         gr.Textbox(
             label="Negative Prompt",
             value=(
@@ -2189,7 +2194,12 @@ video_generation_interface = gr.Interface(
     fn=Generate_Video,
     inputs=[
         gr.Textbox(label="Prompt", placeholder="Enter a prompt for the video", lines=2),
-    gr.Textbox(label="Model", value="Wan-AI/Wan2.2-T2V-A14B", placeholder="creator/model-name"),
         gr.Textbox(label="Negative Prompt", value="", lines=2),
         gr.Slider(minimum=1, maximum=100, value=25, step=1, label="Steps"),
         gr.Slider(minimum=1.0, maximum=20.0, value=3.5, step=0.1, label="CFG Scale"),
@@ -2202,8 +2212,8 @@ video_generation_interface = gr.Interface(
     outputs=gr.Video(label="Generated Video", show_download_button=True, format="mp4"),
     title="Generate Video",
     description=(
-    "<div style=\"text-align:center\">Generate short videos via Hugging Face serverless inference. "
-    "Default model is Wan2.2-T2V-A14B.</div>"
     ),
     api_description=(
         "Generate a short video from a text prompt using a Hugging Face model via serverless inference. "

     ),
     api_description=(
         "Synthesize speech from text using Kokoro-82M TTS model. Returns (sample_rate, waveform) suitable for playback. "
+        "Parameters: text (str), speed (float 0.5–2.0, default 1.25x), voice (str, default 'af_heart'). "
+        "Voice Legend: af=American female, am=American male, bf=British female, bm=British male, ef=European female, em=European male, hf=Hindi female, hm=Hindi male, if=Italian female, im=Italian male, jf=Japanese female, jm=Japanese male, pf=Portuguese female, pm=Portuguese male, zf=Chinese female, zm=Chinese male, ff=French female. "
+        "All Voices: af_alloy, af_aoede, af_bella, af_heart, af_jessica, af_kore, af_nicole, af_nova, af_river, af_sarah, af_sky, am_adam, am_echo, am_eric, am_fenrir, am_liam, am_michael, am_onyx, am_puck, am_santa, bf_alice, bf_emma, bf_isabella, bf_lily, bm_daniel, bm_fable, bm_george, bm_lewis, ef_dora, em_alex, em_santa, ff_siwis, hf_alpha, hf_beta, hm_omega, hm_psi, if_sara, im_nicola, jf_alpha, jf_gongitsune, jf_nezumi, jf_tebukuro, jm_kumo, pf_dora, pm_alex, pm_santa, zf_xiaobei, zf_xiaoni, zf_xiaoxiao, zf_xiaoyi, zm_yunjian, zm_yunxi, zm_yunxia, zm_yunyang. "
         "Return the generated media to the user in this format `![Alt text](URL)`"
     ),
     flagging_mode="never",
     fn=Generate_Image,
     inputs=[
         gr.Textbox(label="Prompt", placeholder="Enter a prompt", lines=2),
+        gr.Textbox(
+            label="Model",
+            value="black-forest-labs/FLUX.1-Krea-dev",
+            placeholder="creator/model-name",
+            info="<a href=\"https://huggingface.co/models?pipeline_tag=text-to-image&inference_provider=nebius,cerebras,novita,fireworks-ai,together,fal-ai,groq,featherless-ai,nscale,hyperbolic,sambanova,cohere,replicate,scaleway,publicai,hf-inference&sort=trending\" target=\"_blank\" rel=\"noopener noreferrer\">Browse models</a>",
+        ),
         gr.Textbox(
             label="Negative Prompt",
             value=(
     fn=Generate_Video,
     inputs=[
         gr.Textbox(label="Prompt", placeholder="Enter a prompt for the video", lines=2),
+        gr.Textbox(
+            label="Model",
+            value="Wan-AI/Wan2.2-T2V-A14B",
+            placeholder="creator/model-name",
+            info="<a href=\"https://huggingface.co/models?pipeline_tag=text-to-video&inference_provider=nebius,cerebras,novita,fireworks-ai,together,fal-ai,groq,featherless-ai,nscale,hyperbolic,sambanova,cohere,replicate,scaleway,publicai,hf-inference&sort=trending\" target=\"_blank\" rel=\"noopener noreferrer\">Browse models</a>",
+        ),
         gr.Textbox(label="Negative Prompt", value="", lines=2),
         gr.Slider(minimum=1, maximum=100, value=25, step=1, label="Steps"),
         gr.Slider(minimum=1.0, maximum=20.0, value=3.5, step=0.1, label="CFG Scale"),
     outputs=gr.Video(label="Generated Video", show_download_button=True, format="mp4"),
     title="Generate Video",
     description=(
+        "<div style=\"text-align:center\">Generate short videos via Hugging Face serverless inference. "
+        "Default model is Wan2.2-T2V-A14B.</div>"
     ),
     api_description=(
         "Generate a short video from a text prompt using a Hugging Face model via serverless inference. "