Loading audiolm_pytorch/audiolm_pytorch.py +9 −4 Original line number Diff line number Diff line Loading @@ -1229,7 +1229,8 @@ class AudioLM(nn.Module): batch_size = 1, text: Optional[List[str]] = None, prime_wave = None, max_length = 2048 max_length = 2048, return_coarse_generated_wave = False ): if exists(prime_wave): prime_wave = prime_wave.to(self.device) Loading @@ -1241,14 +1242,18 @@ class AudioLM(nn.Module): max_length = max_length ) coarse_token_ids = self.coarse.generate( coarse_token_ids_or_recon_wave = self.coarse.generate( text = text, semantic_token_ids = semantic_token_ids semantic_token_ids = semantic_token_ids, reconstruct_wave = return_coarse_generated_wave ) if return_coarse_generated_wave: return coarse_token_ids_or_recon_wave generated_wave = self.fine.generate( text = text, coarse_token_ids = coarse_token_ids, coarse_token_ids = coarse_token_ids_or_recon_wave, reconstruct_wave = True ) Loading setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.0.43', version = '0.0.44', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading Loading
audiolm_pytorch/audiolm_pytorch.py +9 −4 Original line number Diff line number Diff line Loading @@ -1229,7 +1229,8 @@ class AudioLM(nn.Module): batch_size = 1, text: Optional[List[str]] = None, prime_wave = None, max_length = 2048 max_length = 2048, return_coarse_generated_wave = False ): if exists(prime_wave): prime_wave = prime_wave.to(self.device) Loading @@ -1241,14 +1242,18 @@ class AudioLM(nn.Module): max_length = max_length ) coarse_token_ids = self.coarse.generate( coarse_token_ids_or_recon_wave = self.coarse.generate( text = text, semantic_token_ids = semantic_token_ids semantic_token_ids = semantic_token_ids, reconstruct_wave = return_coarse_generated_wave ) if return_coarse_generated_wave: return coarse_token_ids_or_recon_wave generated_wave = self.fine.generate( text = text, coarse_token_ids = coarse_token_ids, coarse_token_ids = coarse_token_ids_or_recon_wave, reconstruct_wave = True ) Loading
setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.0.43', version = '0.0.44', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading