Skip to content

Getting error in AI_Auto_Cover_V1.ipynb - Обработка исходного аудио #2

@omkarpawar2001

Description

@omkarpawar2001

/content/MVSEP-MDX23-Colab_v2
GPU use: 0
started!

Options:
BigShifts: 7

weight_InstVoc: 8.0
weight_VitLarge: 5.0

overlap_InstVoc: 1
overlap_VitLarge: 1

use_VOCFT: False
vocals_only: True
output_format: PCM_16

Loading InstVoc into memory
100% 427M/427M [00:01<00:00, 287MB/s]
100% 709/709 [00:00<00:00, 3.24MB/s]
Loading VitLarge into memory
100% 824M/824M [00:04<00:00, 209MB/s]
100% 1.21k/1.21k [00:00<00:00, 4.60MB/s]
model.safetensors: 100% 850M/850M [00:10<00:00, 84.1MB/s]
Go for: /content/input/audio.mp3
Input audio: (2, 9353217) Sample rate: 44100
Processing vocals with VitLarge model...
0% 0/7 [00:00<?, ?it/s]
2
0% 0/7 [07:07<?, ?it/s]
Traceback (most recent call last):
File "/content/MVSEP-MDX23-Colab_v2/inference.py", line 816, in <module>
predict_with_model(options)
File "/content/MVSEP-MDX23-Colab_v2/inference.py", line 715, in predict_with_model
result, sample_rates = model.separate_music_file(audio.T, sr, i, len(options['input_audio']))
File "/content/MVSEP-MDX23-Colab_v2/inference.py", line 525, in separate_music_file
vocals4, instrum4 = demix_full_vitlarge(audio, self.device, self.model_vl)
File "/content/MVSEP-MDX23-Colab_v2/inference.py", line 311, in demix_full_vitlarge
sources = demix_vitlarge(model, shifted_mix, device)
File "/content/MVSEP-MDX23-Colab_v2/inference.py", line 286, in demix_vitlarge
x = model(part.unsqueeze(0))[0]
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/content/MVSEP-MDX23-Colab_v2/modules/segm_models.py", line 135, in forward
x = self.unet_model(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/segmentation_models_pytorch/base/model.py", line 29, in forward
features = self.encoder(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/segmentation_models_pytorch/encoders/timm_universal.py", line 30, in forward
features = self.model(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/timm/models/_features.py", line 281, in forward
return list(self._collect(x).values())
File "/usr/local/lib/python3.10/dist-packages/timm/models/_features.py", line 235, in _collect
x = module(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/timm/models/maxxvit.py", line 1064, in forward
x = self.blocks(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/container.py", line 215, in forward
input = module(input)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/timm/models/maxxvit.py", line 949, in forward
x = self.conv(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/timm/models/maxxvit.py", line 542, in forward
x = self.conv2_kxk(x)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1518, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1527, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/conv.py", line 460, in forward
return self._conv_forward(input, self.weight, self.bias)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/conv.py", line 456, in _conv_forward
return F.conv2d(input, weight, bias, self.stride,
KeyboardInterrupt

Послушаем разделённый трек.
Нужно немного подождать, сейчас появится...
Вокал:


ValueError Traceback (most recent call last)

in <cell line: 53>()
51 get_ipython().system('ffmpeg -y -i {INSTRUM_FILE} -vn -ar 44100 -ac 2 -b:a 192k {os.path.join(OUTPUT_UVR_FOLDER, INPUT_NAME + "_instrum")}.mp3 &> /dev/null')
52 print("Вокал:")
---> 53 audio_vocal = Audio(os.path.join(OUTPUT_UVR_FOLDER, INPUT_NAME + "_vocals.mp3"), autoplay=False)
54 display(audio_vocal)
55 print("Инструментал:")

/usr/local/lib/python3.10/dist-packages/IPython/lib/display.py in __init__(self, data, filename, url, embed, rate, autoplay, normalize, element_id)
114 if self.data is not None and not isinstance(self.data, bytes):
115 if rate is None:
--> 116 raise ValueError("rate must be specified when data is a numpy array or list of audio samples.")
117 self.data = Audio._make_wav(data, rate, normalize)
118

ValueError: rate must be specified when data is a numpy array or list of audio samples.

Metadata

Assignees

No one assigned

    Labels

    No labels

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions