Skip to content

Commit c5ac204

Browse files
feat: add noisy autoencoder option
1 parent 5950759 commit c5ac204

File tree

2 files changed: 6 additions and 2 deletions

2 files changed: 6 additions and 2 deletions

audio_diffusion_pytorch/modules.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1118,11 +1118,13 @@ def __init__(
11181118
multipliers: Sequence[int],
11191119
factors: Sequence[int],
11201120
num_blocks: Sequence[int],
1121+
use_noisy: bool = False,
11211122
bottleneck: Optional[Bottleneck] = None,
11221123
):
11231124
super().__init__()
11241125
num_layers = len(multipliers) - 1
11251126
self.bottleneck = bottleneck
1127+
self.use_noisy = use_noisy
11261128

11271129
assert len(factors) >= num_layers and len(num_blocks) >= num_layers
11281130

@@ -1150,7 +1152,7 @@ def __init__(
11501152
self.upsamples = nn.ModuleList(
11511153
[
11521154
UpsampleBlock1d(
1153-
in_channels=channels * multipliers[i + 1],
1155+
in_channels=channels * multipliers[i + 1] * (use_noisy + 1),
11541156
out_channels=channels * multipliers[i],
11551157
factor=factors[i],
11561158
num_groups=resnet_groups,
@@ -1183,6 +1185,8 @@ def encode(
11831185

11841186
def decode(self, x: Tensor) -> Tensor:
11851187
for upsample in self.upsamples:
1188+
if self.use_noisy:
1189+
x = torch.cat([x, torch.randn_like(x)], dim=1)
11861190
x = upsample(x)
11871191
return self.to_out(x)
11881192

setup.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
setup(
44
name="audio-diffusion-pytorch",
55
packages=find_packages(exclude=[]),
6-
version="0.0.50",
6+
version="0.0.51",
77
license="MIT",
88
description="Audio Diffusion - PyTorch",
99
long_description_content_type="text/markdown",

0 commit comments

Comments (0)