for the researchers (fabccfd7) · Commits · school / Capstone Design / 01 / AudioLM

audiolm_pytorch/audiolm_pytorch.py

+9 −4

Original line number	Diff line number	Diff line
		@@ -1229,7 +1229,8 @@ class AudioLM(nn.Module):
		batch_size = 1,
		text: Optional[List[str]] = None,
		prime_wave = None,
		max_length = 2048
		max_length = 2048,
		return_coarse_generated_wave = False
		):
		if exists(prime_wave):
		prime_wave = prime_wave.to(self.device)
		@@ -1241,14 +1242,18 @@ class AudioLM(nn.Module):
		max_length = max_length
		)

		coarse_token_ids = self.coarse.generate(
		coarse_token_ids_or_recon_wave = self.coarse.generate(
		text = text,
		semantic_token_ids = semantic_token_ids
		semantic_token_ids = semantic_token_ids,
		reconstruct_wave = return_coarse_generated_wave
		)

		if return_coarse_generated_wave:
		return coarse_token_ids_or_recon_wave

		generated_wave = self.fine.generate(
		text = text,
		coarse_token_ids = coarse_token_ids,
		coarse_token_ids = coarse_token_ids_or_recon_wave,
		reconstruct_wave = True
		)

+1 −1

Original line number	Diff line number	Diff line
		@@ -3,7 +3,7 @@ from setuptools import setup, find_packages
		setup(
		name = 'audiolm-pytorch',
		packages = find_packages(exclude=[]),
		version = '0.0.43',
		version = '0.0.44',
		license='MIT',
		description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch',
		author = 'Phil Wang',