Spaces:
Runtime error
Runtime error
| import yaml | |
| import argbind | |
| import audiotools as at | |
| from vampnet.interface import Interface | |
| import logging | |
| logger = logging.getLogger() | |
| logger.setLevel(logging.DEBUG) | |
| Interface = argbind.bind(Interface) | |
| with open("conf/interface/spotdl.yml") as f: | |
| conf = yaml.safe_load(f) | |
| with argbind.scope(conf): | |
| interface = Interface() | |
| interface.to("cuda") | |
| loader = at.data.datasets.AudioLoader(sources=[ | |
| "input.wav", | |
| ]) | |
| dataset = at.data.datasets.AudioDataset( | |
| loader, | |
| sample_rate=interface.codec.sample_rate, | |
| duration=interface.coarse.chunk_size_s, | |
| n_examples=200, | |
| without_replacement=True, | |
| ) | |
| import numpy as np | |
| def load_random_audio(): | |
| index = np.random.randint(0, len(dataset)) | |
| sig = dataset[index]["signal"] | |
| sig = interface.preprocess(sig) | |
| return sig | |
| sig = load_random_audio() | |
| z = interface.encode(sig) | |
| sig.write('input.wav') | |
| from vampnet import mask as pmask | |
| # build the mask | |
| mask = pmask.linear_random(z, 1.0) | |
| print("coarse") | |
| zv, mask_z = interface.coarse_vamp( | |
| z, | |
| mask=mask, | |
| sampling_steps=36, | |
| temperature=8.0, | |
| return_mask=True, | |
| typical_filtering=False, | |
| # typical_mass=data[typical_mass], | |
| # typical_min_tokens=data[typical_min_tokens], | |
| gen_fn=interface.coarse.generate, | |
| ) | |
| print("coarse2fine") | |
| zv = interface.coarse_to_fine(zv, temperature=0.8) | |
| sig = interface.to_signal(zv).cpu() | |
| sig.write('output-t=8.wav') |