Skip to content

Commit fdf1531

Browse files
committed
period discriminator periods
1 parent 104fb93 commit fdf1531

File tree

5 files changed

+13
-9
lines changed

5 files changed

+13
-9
lines changed

configs/48k_base.json

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -63,6 +63,7 @@
63 63   "upsample_kernel_sizes": [16,16,4,4],
64 64   "n_layers_q": 3,
65 65   "use_spectral_norm": false,
66    - "gin_channels": 256
   66 + "gin_channels": 256,
   67 + "multi_period_discriminator_periods": [2, 3, 5, 7, 11, 13, 17, 19, 23, 29, 31, 37]
67 68   }
68 69   }

infer.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
23 23   import torchaudio
24 24
25 25   if torch.cuda.is_available():
26    -     device = "cuda:6"
   26 +     device = "cuda:5"
27 27   else:
28 28       device = "cpu"
29 29

@@ -90,4 +90,4 @@ def convert(source_audio: str, target_audio: str, speaker_id: int, pitch_shift:
90 90
91 91       sf.write(target_audio, y_hat[0,:,:y_hat_lengths[0]].squeeze(0).detach().numpy(), hparams.data.target_sampling_rate, subtype='PCM_24')
92 92
93    - convert("ncwlq_01.wav", 'out.wav', 143, 0)
   93 + convert("ncwlq_01.wav", 'out.wav', 256, 0)

vits/model/discriminators/multi_period_discriminator.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,15 @@
 1  1
    2 + from typing import List
 2  3   import torch
 3  4   from torch import nn
 4  5   from torch.nn import functional as F
 5  6
 6  7   from .discriminator import DiscriminatorP, DiscriminatorS
 7  8
 8  9   class MultiPeriodDiscriminator(torch.nn.Module):
 9    -     def __init__(self, use_spectral_norm=False):
   10 +     def __init__(self, periods: List[int]=[2, 3, 5, 7, 11, 17, 23, 37], use_spectral_norm: bool=False):
10 11           super(MultiPeriodDiscriminator, self).__init__()
11    -         periods = [2,3,5,7,11]
12    -
   12 +         self.periods = periods
13 13           discs = [DiscriminatorS(use_spectral_norm=use_spectral_norm)]
14 14           discs = discs + [DiscriminatorP(i, use_spectral_norm=use_spectral_norm) for i in periods]
15 15           self.discriminators = nn.ModuleList(discs)

vits/model/synthesizers/synthesizer_svc.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -57,8 +57,8 @@ def __init__(self, spec_channels, segment_size,
57 57   self.enc_p = HubertContentEncoder(kwargs["hubert_ckpt"], inter_channels, hidden_channels, filter_channels,
58 58       n_heads, n_layers, kernel_size, p_dropout, hubert_channels, num_pitch)
59 59   self.dec = torch.hub.load("vtuber-plan/hifi-gan:v0.3.1", "hifigan_48k")
60    - for param in self.dec.parameters():
61    -     param.requires_grad = False
   60 + # for param in self.dec.parameters():
   61 + # param.requires_grad = False
62 62   self.enc_q = PosteriorEncoder(spec_channels, inter_channels, hidden_channels, 5, 1, 16, gin_channels=gin_channels)
63 63   self.flow = ResidualCouplingBlock(inter_channels, hidden_channels, 5, 1, 4, gin_channels=gin_channels)
64 64

vits/model/vcvits.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,10 @@ def __init__(self, **kwargs):
35 35       self.hparams.train.segment_size // self.hparams.data.hop_length,
36 36       n_speakers=self.hparams.data.n_speakers,
37 37       **self.hparams.model)
38    - self.net_period_d = MultiPeriodDiscriminator(self.hparams.model.use_spectral_norm)
   38 + self.net_period_d = MultiPeriodDiscriminator(
   39 +     periods=self.hparams.model.multi_period_discriminator_periods,
   40 +     use_spectral_norm=self.hparams.model.use_spectral_norm
   41 + )
39 42   self.net_scale_d = MultiScaleDiscriminator(self.hparams.model.use_spectral_norm)
40 43   # self.net_pitch_d = PitchDiscriminator(self.hparams.model.use_spectral_norm)
41 44   # speaker discriminator

0 commit comments

Comments
 (0)