@wonwooo

Can you provide the training code for that model?
___
import torch

from naturalspeech2_pytorch import Trainer, EncodecWrapper, Model, NaturalSpeech2, SpeechPromptEncoder

codec = EncodecWrapper()  # built once at module level; handed to NaturalSpeech2 inside main()

def main():  # Reproducer: one manual forward/backward/sample pass, then a Trainer run that raises.
    model = Model(
        dim = 128,
        depth = 6,
        dim_prompt = 512,
        cond_drop_prob = 0.25,
        condition_on_prompt = True
    )

    diffusion = NaturalSpeech2(
        model = model,
        codec = codec,  # the module-level EncodecWrapper instance
        timesteps = 50
    )
    
    raw_audio = torch.randn(4, 327680)  # random stand-in tensors (batch of 4), not real audio
    prompt = torch.randn(4, 32768)

    text = torch.randint(0, 100, (4, 100))  # random integer ids in [0, 100), shape (4, 100)
    text_lens = torch.tensor([100, 50 , 80, 100])  # presumably one length per batch row — confirm

    # Manual forward and backward pass: text, text_lens and prompt are supplied explicitly here.

    loss = diffusion(
        audio = raw_audio,
        text = text,
        text_lens = text_lens,
        prompt = prompt,
        )

    loss.backward()

    # Sampling as it would be done after much training; generated_audio is not used again below.

    generated_audio = diffusion.sample(
        length = 1024,
        text = text,
        prompt = prompt,
        )

    trainer = Trainer(
        diffusion_model = diffusion,
        folder = 'C:\\naturalspeech2-pytorch\\ansunghun',
        train_batch_size = 16,
        gradient_accumulate_every = 2,
        train_num_steps = 5,  # NOTE(review): smaller than save_and_sample_every — confirm a periodic save can ever trigger
        save_and_sample_every = 100,
    )

    trainer.train()  # fails here: the traceback shows train() calling self.model(data), where text is None in forward
    trainer.save_checkpoint('C:\\naturalspeech2-pytorch\\ansunghun\\checkpoint.pt')  # not reached while train() raises
    
if __name__ == '__main__':
    from multiprocessing import freeze_support
    freeze_support()  # per the multiprocessing docs, only has an effect when the script is frozen into an executable
    main()
___
Running the code above fails inside `trainer.train()` with the following error:
___
Traceback (most recent call last):
  File "test.py", line 62, in <module>
    main()
  File "test.py", line 56, in main
    trainer.train()
  File "C:\naturalspeech2-pytorch\naturalspeech2_pytorch\naturalspeech2_pytorch.py", line 1875, in train
    loss = self.model(data)
  File "C:\Users\user\.conda\envs\svc\lib\site-packages\torch\nn\modules\module.py", line 1511, in _wrapped_call_impl
    return self._call_impl(*args, **kwargs)
  File "C:\Users\user\.conda\envs\svc\lib\site-packages\torch\nn\modules\module.py", line 1520, in _call_impl
    return forward_call(*args, **kwargs)
  File "C:\naturalspeech2-pytorch\naturalspeech2_pytorch\naturalspeech2_pytorch.py", line 1522, in forward
    text_max_length = text.shape[-1]
AttributeError: 'NoneType' object has no attribute 'shape'

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

@wonwooo #37

Metadata

Assignees

Labels

Projects

Milestone

Relationships

Development

@wonwooo #37

Description

Metadata

Metadata

Assignees

Labels

Projects

Milestone

Relationships

Development

Issue actions