shark8me · September 16, 2022 13:45
diff --git a/convstack2d.py b/convstack2d.py
 class ConvStack2d(nn.Module):
    """2-D convolutional stack followed by two fully connected heads.

    ``forward`` takes a 3-D tensor ``(batch, frames, input_features)``,
    reshapes it to a single-channel image, runs three 3x3 conv layers with
    two ``(1, 2)`` max-pools (which shrink only the last axis), reduces every
    frame to one scalar with ``self.fc`` and finally maps the ``frames``-long
    vector to ``output_features`` values with ``self.fc2``.

    NOTE(review): ``output_features`` is floor-divided by 16 and 8 to get the
    channel counts, so it presumably should be a multiple of 16 (and at least
    16) -- confirm against callers.
    """

    def __init__(self, input_features, output_features, num_steps=None):
        """Build the convolutional stack and the two linear heads.

        Args:
            input_features: size of the last axis of the input passed to
                ``forward``.
            output_features: size of the last axis of the result; also
                determines the conv channel counts (``// 16`` and ``// 8``).
            num_steps: number of frames (axis 1 of the input). ``self.fc2``
                is a ``Linear`` over the frame axis, so the input must have
                exactly this many frames. When omitted, a module-level
                ``num_steps`` is used if one exists, which is what the
                previous implementation implicitly relied on.

        Raises:
            ValueError: if ``num_steps`` is neither passed nor defined at
                module level.
        """
        super().__init__()

        if num_steps is None:
            # Backward compatibility: the old code read a global ``num_steps``.
            num_steps = globals().get("num_steps")
        if num_steps is None:
            raise ValueError(
                "num_steps (number of input frames) must be provided"
            )

        narrow = output_features // 16
        wide = output_features // 8

        # input is batch_size * 1 channel * frames * input_features
        self.cnn = nn.Sequential(
            # layer 0
            nn.Conv2d(1, narrow, (3, 3), padding=1),
            nn.BatchNorm2d(narrow),
            nn.ReLU(),
            # layer 1
            nn.Conv2d(narrow, narrow, (3, 3), padding=1),
            nn.BatchNorm2d(narrow),
            nn.ReLU(),
            # layer 2
            nn.MaxPool2d((1, 2)),
            nn.Dropout(0.25),
            nn.Conv2d(narrow, wide, (3, 3), padding=1),
            nn.BatchNorm2d(wide),
            nn.ReLU(),
            # layer 3
            nn.MaxPool2d((1, 2)),
            nn.Dropout(0.25),
        )
        # Per frame: (channels * pooled features) -> output_features -> 1.
        # The two pools leave input_features // 4 values on the last axis.
        self.fc = nn.Sequential(
            nn.Linear(wide * (input_features // 4), output_features),
            nn.Linear(output_features, 1),
        )
        # Across frames: num_steps -> output_features.
        self.fc2 = nn.Sequential(
            nn.Linear(num_steps, output_features),
        )

    def forward(self, mel):
        """Run the stack on ``mel`` of shape ``(batch, frames, input_features)``.

        Returns a tensor of shape ``(batch, output_features)``.
        """
        # Insert the single channel axis expected by Conv2d.
        x = mel.view(mel.size(0), 1, mel.size(1), mel.size(2))
        x = self.cnn(x)
        # (batch, channels, frames, feat) -> (batch, frames, channels * feat)
        x = x.transpose(1, 2).flatten(-2)
        x = self.fc(x)
        # Drop only the trailing size-1 axis. A bare squeeze() would also
        # remove the batch axis when batch size is 1.
        x = x.squeeze(-1)
        x = self.fc2(x)
        return x
	class ConvStack2d(nn.Module):
	    """2-D convolutional stack followed by two fully connected heads.

	    ``forward`` takes a 3-D tensor ``(batch, frames, input_features)``,
	    reshapes it to a single-channel image, runs three 3x3 conv layers with
	    two ``(1, 2)`` max-pools (which shrink only the last axis), reduces every
	    frame to one scalar with ``self.fc`` and finally maps the ``frames``-long
	    vector to ``output_features`` values with ``self.fc2``.

	    NOTE(review): ``output_features`` is floor-divided by 16 and 8 to get the
	    channel counts, so it presumably should be a multiple of 16 (and at least
	    16) -- confirm against callers.
	    """

	    def __init__(self, input_features, output_features, num_steps=None):
	        """Build the convolutional stack and the two linear heads.

	        Args:
	            input_features: size of the last axis of the input passed to
	                ``forward``.
	            output_features: size of the last axis of the result; also
	                determines the conv channel counts (``// 16`` and ``// 8``).
	            num_steps: number of frames (axis 1 of the input). ``self.fc2``
	                is a ``Linear`` over the frame axis, so the input must have
	                exactly this many frames. When omitted, a module-level
	                ``num_steps`` is used if one exists, which is what the
	                previous implementation implicitly relied on.

	        Raises:
	            ValueError: if ``num_steps`` is neither passed nor defined at
	                module level.
	        """
	        super().__init__()

	        if num_steps is None:
	            # Backward compatibility: the old code read a global ``num_steps``.
	            num_steps = globals().get("num_steps")
	        if num_steps is None:
	            raise ValueError(
	                "num_steps (number of input frames) must be provided"
	            )

	        narrow = output_features // 16
	        wide = output_features // 8

	        # input is batch_size * 1 channel * frames * input_features
	        self.cnn = nn.Sequential(
	            # layer 0
	            nn.Conv2d(1, narrow, (3, 3), padding=1),
	            nn.BatchNorm2d(narrow),
	            nn.ReLU(),
	            # layer 1
	            nn.Conv2d(narrow, narrow, (3, 3), padding=1),
	            nn.BatchNorm2d(narrow),
	            nn.ReLU(),
	            # layer 2
	            nn.MaxPool2d((1, 2)),
	            nn.Dropout(0.25),
	            nn.Conv2d(narrow, wide, (3, 3), padding=1),
	            nn.BatchNorm2d(wide),
	            nn.ReLU(),
	            # layer 3
	            nn.MaxPool2d((1, 2)),
	            nn.Dropout(0.25),
	        )
	        # Per frame: (channels * pooled features) -> output_features -> 1.
	        # The two pools leave input_features // 4 values on the last axis.
	        self.fc = nn.Sequential(
	            nn.Linear(wide * (input_features // 4), output_features),
	            nn.Linear(output_features, 1),
	        )
	        # Across frames: num_steps -> output_features.
	        self.fc2 = nn.Sequential(
	            nn.Linear(num_steps, output_features),
	        )

	    def forward(self, mel):
	        """Run the stack on ``mel`` of shape ``(batch, frames, input_features)``.

	        Returns a tensor of shape ``(batch, output_features)``.
	        """
	        # Insert the single channel axis expected by Conv2d.
	        x = mel.view(mel.size(0), 1, mel.size(1), mel.size(2))
	        x = self.cnn(x)
	        # (batch, channels, frames, feat) -> (batch, frames, channels * feat)
	        x = x.transpose(1, 2).flatten(-2)
	        x = self.fc(x)
	        # Drop only the trailing size-1 axis. A bare squeeze() would also
	        # remove the batch axis when batch size is 1.
	        x = x.squeeze(-1)
	        x = self.fc2(x)
	        return x
No results found