Spaces:
Running
on
Zero
Running
on
Zero
File size: 1,427 Bytes
9172422 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
import torch
import pandas as pd
from stable_audio_tools import get_pretrained_model
import json
from stable_audio_tools.interface.generate_augs import generate_aug_one_sample, load_model
# import generate_aug_one_sample, load_model
model_config_path = '/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/mod_config.json'
ckpt_path = '/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/sonal_ft.safetensors'
pretrained_name = None
pretransform_ckpt_path = None
model_half=False
device = torch.device("cuda")
df = pd.read_csv('/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/dummy.csv')
if model_config_path is not None:
# Load config from json file
with open(model_config_path) as f:
model_config = json.load(f)
for i, row in df.iterrows():
caption = row['caption']
duration = float(row['duration'])
output_path = row['output_path']
_, model_config = load_model(model_config, ckpt_path, pretrained_name=pretrained_name, pretransform_ckpt_path=pretransform_ckpt_path, model_half=model_half, device=device)
generate_aug_one_sample(model_config, duration, caption, steps=250, inpainting=False, init_audio=None, init_noise_level=80.0, output_file_name=output_path)
# caption,duration,output_path
# 'sound of a beep',2.0,'/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/stable_audio_tools/interface/output_sakshi/beep.wav' |