"""Example script: run one audio file through a VampNet interface.

Loads ``assets/example.wav``, encodes it, builds a mask over the codes,
calls ``interface.vamp`` on the masked codes, decodes the result, and writes
it to ``scratch/output.wav``.
"""
import random
from pathlib import Path

import vampnet
import audiotools as at

# Load the default interface.
interface = vampnet.interface.Interface.default()

# List the models the interface reports as available.
finetuned_model_choices = interface.available_models()
print(f"available finetuned models: {finetuned_model_choices}")

# Pick one of them at random (demonstrates how a choice could be made) ...
model_choice = random.choice(finetuned_model_choices)
print(f"choosing model: {model_choice}")

# ... but then override the random pick so the example always uses "default".
print("actually, forcing model: default")
model_choice = "default"

# Load the selected model into the interface.
interface.load_finetuned(model_choice)

# Read the input audio.
signal = at.AudioSignal("assets/example.wav")

# Encode the audio signal into codes.
codes = interface.encode(signal)

# Build the mask passed to vamp() below.
# NOTE(review): presumably periodic_prompt keeps every 13th timestep unmasked
# and upper_codebook_mask masks codebooks from index 3 up -- confirm against
# the vampnet Interface.build_mask documentation.
mask = interface.build_mask(
    codes,
    signal,
    periodic_prompt=13,
    upper_codebook_mask=3,
)

# Generate new tokens from the codes and mask; return_mask=False means only
# the tokens are returned.
output_tokens = interface.vamp(
    codes,
    mask,
    return_mask=False,
    temperature=1.0,
    typical_filtering=False,
    debug=True,
)

# Decode the generated tokens back into an audio signal.
output_signal = interface.decode(output_tokens)

# Make sure the destination directory exists before writing, so the script
# does not fail at the very last step on a fresh checkout without scratch/.
output_path = "scratch/output.wav"
Path(output_path).parent.mkdir(parents=True, exist_ok=True)
output_signal.write(output_path)