sonalkum's picture
stable
9172422
raw
history blame
1.43 kB
import torch
import pandas as pd
from stable_audio_tools import get_pretrained_model
import json
from stable_audio_tools.interface.generate_augs import generate_aug_one_sample, load_model
# import generate_aug_one_sample, load_model
model_config_path = '/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/mod_config.json'
ckpt_path = '/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/sonal_ft.safetensors'
pretrained_name = None
pretransform_ckpt_path = None
model_half=False
device = torch.device("cuda")
df = pd.read_csv('/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/dummy.csv')
if model_config_path is not None:
# Load config from json file
with open(model_config_path) as f:
model_config = json.load(f)
for i, row in df.iterrows():
caption = row['caption']
duration = float(row['duration'])
output_path = row['output_path']
_, model_config = load_model(model_config, ckpt_path, pretrained_name=pretrained_name, pretransform_ckpt_path=pretransform_ckpt_path, model_half=model_half, device=device)
generate_aug_one_sample(model_config, duration, caption, steps=250, inpainting=False, init_audio=None, init_noise_level=80.0, output_file_name=output_path)
# caption,duration,output_path
# 'sound of a beep',2.0,'/fs/nexus-projects/brain_project/aaai_2025/stable-audio-tools/stable_audio_tools/interface/output_sakshi/beep.wav'