Spaces:
Runtime error
Runtime error
limit input length (#2)
Browse files
- limit input length (e7fdc7d42ccb0fbdd26d56c42db931a377cfc85b)
- Update app.py (19a7ce50f59e767c97f0f9b445e8b4cfd3748b06)
app.py
CHANGED
|
@@ -71,15 +71,6 @@ def sample(ldm_stable, zs, wts, steps, prompt_tar, tstart, cfg_scale_tar): # ,
|
|
| 71 |
return f.name
|
| 72 |
|
| 73 |
|
| 74 |
-
# def change_tstart_range(t_start, steps):
|
| 75 |
-
# maximum = int(0.8 * steps)
|
| 76 |
-
# minimum = int(0.15 * steps)
|
| 77 |
-
# if t_start > maximum:
|
| 78 |
-
# t_start = maximum
|
| 79 |
-
# elif t_start < minimum:
|
| 80 |
-
# t_start = minimum
|
| 81 |
-
# return t_start
|
| 82 |
-
|
| 83 |
|
| 84 |
def edit(input_audio,
|
| 85 |
model_id: str,
|
|
@@ -93,13 +84,6 @@ def edit(input_audio,
|
|
| 93 |
t_start=45,
|
| 94 |
randomize_seed=True):
|
| 95 |
|
| 96 |
-
# global ldm_stable, current_loaded_model
|
| 97 |
-
# print(f'current loaded model: {ldm_stable.model_id}')
|
| 98 |
-
# if model_id != current_loaded_model:
|
| 99 |
-
# print(f'Changing model to {model_id}...')
|
| 100 |
-
# current_loaded_model = model_id
|
| 101 |
-
# ldm_stable = None
|
| 102 |
-
# ldm_stable = load_model(model_id, device)
|
| 103 |
print(model_id)
|
| 104 |
if model_id == LDM2:
|
| 105 |
ldm_stable = ldm2
|
|
@@ -219,7 +203,7 @@ with gr.Blocks(css='style.css') as demo:
|
|
| 219 |
do_inversion = gr.State(value=True) # To save some runtime when editing the same thing over and over
|
| 220 |
|
| 221 |
with gr.Row():
|
| 222 |
-
input_audio = gr.Audio(sources=["upload", "microphone"],
|
| 223 |
interactive=True, scale=1)
|
| 224 |
output_audio = gr.Audio(label="Edited Audio", interactive=False, scale=1)
|
| 225 |
|
|
|
|
| 71 |
return f.name
|
| 72 |
|
| 73 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 74 |
|
| 75 |
def edit(input_audio,
|
| 76 |
model_id: str,
|
|
|
|
| 84 |
t_start=45,
|
| 85 |
randomize_seed=True):
|
| 86 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 87 |
print(model_id)
|
| 88 |
if model_id == LDM2:
|
| 89 |
ldm_stable = ldm2
|
|
|
|
| 203 |
do_inversion = gr.State(value=True) # To save some runtime when editing the same thing over and over
|
| 204 |
|
| 205 |
with gr.Row():
|
| 206 |
+
input_audio = gr.Audio(sources=["upload", "microphone"], type="filepath", label="Input Audio",
|
| 207 |
interactive=True, scale=1)
|
| 208 |
output_audio = gr.Audio(label="Edited Audio", interactive=False, scale=1)
|
| 209 |
|
utils.py
CHANGED
|
@@ -16,7 +16,7 @@ def load_audio(audio_path: Union[str, np.array], fn_STFT, left: int = 0, right:
|
|
| 16 |
import audioldm
|
| 17 |
import audioldm.audio
|
| 18 |
|
| 19 |
-
duration = audioldm.utils.get_duration(audio_path)
|
| 20 |
|
| 21 |
mel, _, _ = audioldm.audio.wav_to_fbank(audio_path, target_length=int(duration * 102.4), fn_STFT=fn_STFT)
|
| 22 |
mel = mel.unsqueeze(0)
|
|
|
|
| 16 |
import audioldm
|
| 17 |
import audioldm.audio
|
| 18 |
|
| 19 |
+
duration = min(audioldm.utils.get_duration(audio_path), 15)
|
| 20 |
|
| 21 |
mel, _, _ = audioldm.audio.wav_to_fbank(audio_path, target_length=int(duration * 102.4), fn_STFT=fn_STFT)
|
| 22 |
mel = mel.unsqueeze(0)
|