Loading audiolm_pytorch/audiolm_pytorch.py +2 −2 Original line number Diff line number Diff line Loading @@ -592,7 +592,7 @@ class CoarseTransformer(nn.Module): codebook_size_with_eos = codebook_size + 1 self.coarse_embedding = nn.Embedding(num_coarse_quantizers * codebook_size_with_eos, dim) text_dim = get_encoded_dim(t5_name) text_dim = default(cond_dim, get_encoded_dim(t5_name)) self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity() self.transformer = Transformer( Loading Loading @@ -767,7 +767,7 @@ class FineTransformer(nn.Module): self.eos_id = codebook_size text_dim = get_encoded_dim(t5_name) text_dim = default(cond_dim, get_encoded_dim(t5_name)) self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity() self.transformer = Transformer( Loading setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.9.3', version = '0.9.4', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading Loading
audiolm_pytorch/audiolm_pytorch.py +2 −2 Original line number Diff line number Diff line Loading @@ -592,7 +592,7 @@ class CoarseTransformer(nn.Module): codebook_size_with_eos = codebook_size + 1 self.coarse_embedding = nn.Embedding(num_coarse_quantizers * codebook_size_with_eos, dim) text_dim = get_encoded_dim(t5_name) text_dim = default(cond_dim, get_encoded_dim(t5_name)) self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity() self.transformer = Transformer( Loading Loading @@ -767,7 +767,7 @@ class FineTransformer(nn.Module): self.eos_id = codebook_size text_dim = get_encoded_dim(t5_name) text_dim = default(cond_dim, get_encoded_dim(t5_name)) self.proj_text_embed = nn.Linear(text_dim, dim, bias = False) if text_dim != dim else nn.Identity() self.transformer = Transformer( Loading
setup.py +1 −1 Original line number Diff line number Diff line Loading @@ -3,7 +3,7 @@ from setuptools import setup, find_packages setup( name = 'audiolm-pytorch', packages = find_packages(exclude=[]), version = '0.9.3', version = '0.9.4', license='MIT', description = 'AudioLM - Language Modeling Approach to Audio Generation from Google Research - Pytorch', author = 'Phil Wang', Loading