This project is archived. Its data is read-only.

Commit 2ebe3541 authored Feb 02, 2023 by Phil Wang

fix

parent 49cc3923

audiolm_pytorch/audiolm_pytorch.py

+2 −2

Original line number	Diff line number	Diff line
		@@ -592,7 +592,7 @@ class CoarseTransformer(nn.Module):
		codebook_size_with_eos = codebook_size + 1
		self.coarse_embedding = nn.Embedding(num_coarse_quantizers * codebook_size_with_eos, dim)

		- text_dim = get_encoded_dim(t5_name)
		+ text_dim = default(cond_dim, get_encoded_dim(t5_name))
		self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity()

		self.transformer = Transformer(
		@@ -767,7 +767,7 @@ class FineTransformer(nn.Module):

		self.eos_id = codebook_size

		- text_dim = get_encoded_dim(t5_name)
		+ text_dim = default(cond_dim, get_encoded_dim(t5_name))
		self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity()

		self.transformer = Transformer(

setup.py

+1 −1

Original line number	Diff line number	Diff line
		@@ -3,7 +3,7 @@ from setuptools import setup, find_packages
		setup(
		name = 'audiolm-pytorch',
		packages = find_packages(exclude=[]),
		- version = '0.9.3',
		+ version = '0.9.4',
		license='MIT',
		description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch',
		author = 'Phil Wang',