| | import torchaudio |
| | from audiocraft.models import AudioGen |
| | from audiocraft.data.audio import audio_write |
| |
|
| | model = AudioGen.get_pretrained('facebook/audiogen-medium') |
| | model.set_generation_params(duration=5) |
| | wav = model.generate_unconditional(4) |
| | descriptions = ['dog barking', 'sirenes of an emergency vehicule', 'footsteps in a corridor'] |
| | wav = model.generate(descriptions) |
| |
|
| | for idx, one_wav in enumerate(wav): |
| | |
| | audio_write(f'{idx}', one_wav.cpu(), model.sample_rate, strategy="loudness", loudness_compressor=True) |
| |
|