An advanced singing voice synthesis system with high fidelity, expressiveness, controllability, and flexibility, based on "DiffSinger: Singing Voice Synthesis via Shallow Diffusion Mechanism".
Traceback (most recent call last):
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/scripts/train.py", line 31, in <module>
run_task()
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/scripts/train.py", line 27, in run_task
task_cls.start()
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/basics/base_task.py", line 467, in start
trainer.fit(task, ckpt_path=get_latest_checkpoint_path(work_dir))
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 520, in fit
call._call_and_handle_interrupt(
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/call.py", line 44, in _call_and_handle_interrupt
return trainer_fn(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 559, in _fit_impl
self._run(model, ckpt_path=ckpt_path)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 935, in _run
results = self._run_stage()
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 976, in _run_stage
self._run_sanity_check()
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/trainer.py", line 1005, in _run_sanity_check
val_loop.run()
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/loops/utilities.py", line 177, in _decorator
return loop_run(self, *args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/loops/evaluation_loop.py", line 115, in run
self._evaluation_step(batch, batch_idx, dataloader_idx)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/loops/evaluation_loop.py", line 375, in _evaluation_step
output = call._call_strategy_hook(trainer, hook_name, *step_kwargs.values())
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/trainer/call.py", line 288, in _call_strategy_hook
output = fn(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/lightning/pytorch/strategies/strategy.py", line 378, in validation_step
return self.model.validation_step(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/basics/base_task.py", line 272, in validation_step
losses, weight = self._validation_step(sample, batch_idx)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/training/acoustic_task.py", line 158, in _validation_step
mel_out: ShallowDiffusionOutput = self.run_model(sample, infer=True)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/training/acoustic_task.py", line 122, in run_model
output: ShallowDiffusionOutput = self.model(
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/toplevel.py", line 105, in forward
mel_pred = self.diffusion(condition, src_spec=src_mel, infer=True)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/diffusion/RectifiedFlow.py", line 91, in forward
x = self.inference(cond, b=b, x_start=spec, device=device)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
return func(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/diffusion/RectifiedFlow.py", line 222, in inference
x, _ = algorithm_fn(x,t_start+ i*dt, dt, cond, model_fn=self.denoise_fn)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
return func(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/diffusion/RectifiedFlow.py", line 102, in sample_rk4
k_1 = model_fn(x, self.timesteps * t, cond)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/diffusion/wavenet.py", line 103, in forward
diffusion_step = self.diffusion_embedding(diffusion_step)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/home/linjl/anaconda3/envs/diffv2-2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/home/linjl/diffsinger-Reflow/DiffSinger-RectifiedFlow/modules/diffusion/wavenet.py", line 23, in forward
device = x.device
AttributeError: 'float' object has no attribute 'device'
Python version: 3.10.13; torch version: 2.2.2+cu121 (now) / 1.13.1+cu117 (before). Traceback:
acoustic config: