Loading audiolm_pytorch/soundstream.py +6 −1 Original line number Diff line number Diff line Loading @@ -355,7 +355,12 @@ class SoundStream(nn.Module): self.load_state_dict(torch.load(str(path))) def non_discr_parameters(self): return [*self.encoder.parameters(), *self.decoder.parameters()] return [ *self.encoder.parameters(), *self.decoder.parameters(), *self.encoder_attn.parameters(), *self.decoder_attn.parameters() ] @property def seq_len_multiple_of(self): Loading audiolm_pytorch/trainer.py +2 −1 Original line number Diff line number Diff line Loading @@ -319,6 +319,8 @@ class SoundStreamTrainer(nn.Module): # update discriminator self.discr_optim.zero_grad() for _ in range(self.grad_accum_every): wave, = next(self.dl_iter) wave = wave.to(device) Loading @@ -340,7 +342,6 @@ class SoundStreamTrainer(nn.Module): # gradient step for all discriminators self.discr_optim.step() self.discr_optim.zero_grad() for ind in range(len(self.soundstream.discriminators)): discr_optimizer = getattr(self, f'multiscale_discr_optimizer_{ind}') Loading setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.3.5', version = '0.3.6', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading Loading
audiolm_pytorch/soundstream.py +6 −1 Original line number Diff line number Diff line Loading @@ -355,7 +355,12 @@ class SoundStream(nn.Module): self.load_state_dict(torch.load(str(path))) def non_discr_parameters(self): return [*self.encoder.parameters(), *self.decoder.parameters()] return [ *self.encoder.parameters(), *self.decoder.parameters(), *self.encoder_attn.parameters(), *self.decoder_attn.parameters() ] @property def seq_len_multiple_of(self): Loading
audiolm_pytorch/trainer.py +2 −1 Original line number Diff line number Diff line Loading @@ -319,6 +319,8 @@ class SoundStreamTrainer(nn.Module): # update discriminator self.discr_optim.zero_grad() for _ in range(self.grad_accum_every): wave, = next(self.dl_iter) wave = wave.to(device) Loading @@ -340,7 +342,6 @@ class SoundStreamTrainer(nn.Module): # gradient step for all discriminators self.discr_optim.step() self.discr_optim.zero_grad() for ind in range(len(self.soundstream.discriminators)): discr_optimizer = getattr(self, f'multiscale_discr_optimizer_{ind}') Loading
setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.3.5', version = '0.3.6', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading