Hi! I am trying to run TTS, but I get errors like the one below.
I have tried different models and configs at different points in the git history, but the errors persist.
Loading TTS model ...
| > model config: C:\Users\SDE-02\PycharmProjects\TTS1\config.json
| > model file: checkpoint_272976.pth.tar
Setting up Audio Processor...
| > sample_rate:22050
| > num_mels:80
| > min_level_db:-100
| > frame_shift_ms:12.5
| > frame_length_ms:50
| > ref_level_db:20
| > num_freq:1025
| > power:1.5
| > preemphasis:0.98
| > griffin_lim_iters:60
| > signal_norm:True
| > symmetric_norm:False
| > mel_fmin:0
| > mel_fmax:8000.0
| > max_norm:1.0
| > clip_norm:True
| > do_trim_silence:True
| > n_fft:2048
| > hop_length:275
| > win_length:1102
Using model: Tacotron2
Traceback (most recent call last):
File "C:/Users/SDE-02/PycharmProjects/TTS1/server/test1.py", line 5, in <module>
synthesizer = Synthesizer(config)
File "C:\Users\SDE-02\PycharmProjects\TTS1\server\synthesizer.py", line 29, in __init__
self.load_tts(self.config.tts_path, self.config.tts_file, self.config.tts_config, config.use_cuda)
File "C:\Users\SDE-02\PycharmProjects\TTS1\server\synthesizer.py", line 61, in load_tts
self.tts_model.load_state_dict(cp['model'])
File "C:\Users\SDE-02\AppData\Local\Programs\Python\Python36\lib\site-packages\torch\nn\modules\module.py", line 845, in load_state_dict
self.__class__.__name__, "\n\t".join(error_msgs)))
RuntimeError: Error(s) in loading state_dict for Tacotron2:
Missing key(s) in state_dict: âencoder.convolutions.0.net.0.weightâ, âencoder.convolutions.0.net.0.biasâ, âencoder.convolutions.0.net.1.weightâ, âencoder.convolutions.0.net.1.biasâ, âencoder.convolutions.0.net.1.running_meanâ, âencoder.convolutions.0.net.1.running_varâ, âencoder.convolutions.1.net.0.weightâ, âencoder.convolutions.1.net.0.biasâ, âencoder.convolutions.1.net.1.weightâ, âencoder.convolutions.1.net.1.biasâ, âencoder.convolutions.1.net.1.running_meanâ, âencoder.convolutions.1.net.1.running_varâ, âencoder.convolutions.2.net.0.weightâ, âencoder.convolutions.2.net.0.biasâ, âencoder.convolutions.2.net.1.weightâ, âencoder.convolutions.2.net.1.biasâ, âencoder.convolutions.2.net.1.running_meanâ, âencoder.convolutions.2.net.1.running_varâ, âencoder.lstm.weight_ih_l0â, âencoder.lstm.weight_hh_l0â, âencoder.lstm.bias_ih_l0â, âencoder.lstm.bias_hh_l0â, âencoder.lstm.weight_ih_l0_reverseâ, âencoder.lstm.weight_hh_l0_reverseâ, âencoder.lstm.bias_ih_l0_reverseâ, âencoder.lstm.bias_hh_l0_reverseâ, âdecoder.prenet.layers.0.linear_layer.weightâ, âdecoder.prenet.layers.1.linear_layer.weightâ, âdecoder.attention_rnn.weight_ihâ, âdecoder.attention_rnn.weight_hhâ, âdecoder.attention_rnn.bias_ihâ, âdecoder.attention_rnn.bias_hhâ, âdecoder.attention_layer.query_layer.linear_layer.weightâ, âdecoder.attention_layer.inputs_layer.linear_layer.weightâ, âdecoder.attention_layer.v.linear_layer.weightâ, âdecoder.attention_layer.v.linear_layer.biasâ, âdecoder.decoder_rnn.weight_ihâ, âdecoder.decoder_rnn.weight_hhâ, âdecoder.decoder_rnn.bias_ihâ, âdecoder.decoder_rnn.bias_hhâ, âdecoder.linear_projection.linear_layer.weightâ, âdecoder.linear_projection.linear_layer.biasâ, âdecoder.stopnet.1.linear_layer.weightâ, âdecoder.stopnet.1.linear_layer.biasâ, âdecoder.attention_rnn_init.weightâ, âdecoder.go_frame_init.weightâ, âdecoder.decoder_rnn_inits.weightâ, âpostnet.convolutions.0.net.0.weightâ, âpostnet.convolutions.0.net.0.biasâ, âpostnet.convolutions.0.net.1.weightâ, 
âpostnet.convolutions.0.net.1.biasâ, âpostnet.convolutions.0.net.1.running_meanâ, âpostnet.convolutions.0.net.1.running_varâ, âpostnet.convolutions.1.net.0.weightâ, âpostnet.convolutions.1.net.0.biasâ, âpostnet.convolutions.1.net.1.weightâ, âpostnet.convolutions.1.net.1.biasâ, âpostnet.convolutions.1.net.1.running_meanâ, âpostnet.convolutions.1.net.1.running_varâ, âpostnet.convolutions.2.net.0.weightâ, âpostnet.convolutions.2.net.0.biasâ, âpostnet.convolutions.2.net.1.weightâ, âpostnet.convolutions.2.net.1.biasâ, âpostnet.convolutions.2.net.1.running_meanâ, âpostnet.convolutions.2.net.1.running_varâ, âpostnet.convolutions.3.net.0.weightâ, âpostnet.convolutions.3.net.0.biasâ, âpostnet.convolutions.3.net.1.weightâ, âpostnet.convolutions.3.net.1.biasâ, âpostnet.convolutions.3.net.1.running_meanâ, âpostnet.convolutions.3.net.1.running_varâ, âpostnet.convolutions.4.net.0.weightâ, âpostnet.convolutions.4.net.0.biasâ, âpostnet.convolutions.4.net.1.weightâ, âpostnet.convolutions.4.net.1.biasâ, âpostnet.convolutions.4.net.1.running_meanâ, âpostnet.convolutions.4.net.1.running_varâ.
Unexpected key(s) in state_dict: âlast_linear.weightâ, âlast_linear.biasâ, âencoder.prenet.layers.0.weightâ, âencoder.prenet.layers.0.biasâ, âencoder.prenet.layers.1.weightâ, âencoder.prenet.layers.1.biasâ, âencoder.cbhg.conv1d_banks.0.conv1d.weightâ, âencoder.cbhg.conv1d_banks.0.bn.weightâ, âencoder.cbhg.conv1d_banks.0.bn.biasâ, âencoder.cbhg.conv1d_banks.0.bn.running_meanâ, âencoder.cbhg.conv1d_banks.0.bn.running_varâ, âencoder.cbhg.conv1d_banks.1.conv1d.weightâ, âencoder.cbhg.conv1d_banks.1.bn.weightâ, âencoder.cbhg.conv1d_banks.1.bn.biasâ, âencoder.cbhg.conv1d_banks.1.bn.running_meanâ, âencoder.cbhg.conv1d_banks.1.bn.running_varâ, âencoder.cbhg.conv1d_banks.2.conv1d.weightâ, âencoder.cbhg.conv1d_banks.2.bn.weightâ, âencoder.cbhg.conv1d_banks.2.bn.biasâ, âencoder.cbhg.conv1d_banks.2.bn.running_meanâ, âencoder.cbhg.conv1d_banks.2.bn.running_varâ, âencoder.cbhg.conv1d_banks.3.conv1d.weightâ, âencoder.cbhg.conv1d_banks.3.bn.weightâ, âencoder.cbhg.conv1d_banks.3.bn.biasâ, âencoder.cbhg.conv1d_banks.3.bn.running_meanâ, âencoder.cbhg.conv1d_banks.3.bn.running_varâ, âencoder.cbhg.conv1d_banks.4.conv1d.weightâ, âencoder.cbhg.conv1d_banks.4.bn.weightâ, âencoder.cbhg.conv1d_banks.4.bn.biasâ, âencoder.cbhg.conv1d_banks.4.bn.running_meanâ, âencoder.cbhg.conv1d_banks.4.bn.running_varâ, âencoder.cbhg.conv1d_banks.5.conv1d.weightâ, âencoder.cbhg.conv1d_banks.5.bn.weightâ, âencoder.cbhg.conv1d_banks.5.bn.biasâ, âencoder.cbhg.conv1d_banks.5.bn.running_meanâ, âencoder.cbhg.conv1d_banks.5.bn.running_varâ, âencoder.cbhg.conv1d_banks.6.conv1d.weightâ, âencoder.cbhg.conv1d_banks.6.bn.weightâ, âencoder.cbhg.conv1d_banks.6.bn.biasâ, âencoder.cbhg.conv1d_banks.6.bn.running_meanâ, âencoder.cbhg.conv1d_banks.6.bn.running_varâ, âencoder.cbhg.conv1d_banks.7.conv1d.weightâ, âencoder.cbhg.conv1d_banks.7.bn.weightâ, âencoder.cbhg.conv1d_banks.7.bn.biasâ, âencoder.cbhg.conv1d_banks.7.bn.running_meanâ, âencoder.cbhg.conv1d_banks.7.bn.running_varâ, âencoder.cbhg.conv1d_banks.8.conv1d.weightâ, 
âencoder.cbhg.conv1d_banks.8.bn.weightâ, âencoder.cbhg.conv1d_banks.8.bn.biasâ, âencoder.cbhg.conv1d_banks.8.bn.running_meanâ, âencoder.cbhg.conv1d_banks.8.bn.running_varâ, âencoder.cbhg.conv1d_banks.9.conv1d.weightâ, âencoder.cbhg.conv1d_banks.9.bn.weightâ, âencoder.cbhg.conv1d_banks.9.bn.biasâ, âencoder.cbhg.conv1d_banks.9.bn.running_meanâ, âencoder.cbhg.conv1d_banks.9.bn.running_varâ, âencoder.cbhg.conv1d_banks.10.conv1d.weightâ, âencoder.cbhg.conv1d_banks.10.bn.weightâ, âencoder.cbhg.conv1d_banks.10.bn.biasâ, âencoder.cbhg.conv1d_banks.10.bn.running_meanâ, âencoder.cbhg.conv1d_banks.10.bn.running_varâ, âencoder.cbhg.conv1d_banks.11.conv1d.weightâ, âencoder.cbhg.conv1d_banks.11.bn.weightâ, âencoder.cbhg.conv1d_banks.11.bn.biasâ, âencoder.cbhg.conv1d_banks.11.bn.running_meanâ, âencoder.cbhg.conv1d_banks.11.bn.running_varâ, âencoder.cbhg.conv1d_banks.12.conv1d.weightâ, âencoder.cbhg.conv1d_banks.12.bn.weightâ, âencoder.cbhg.conv1d_banks.12.bn.biasâ, âencoder.cbhg.conv1d_banks.12.bn.running_meanâ, âencoder.cbhg.conv1d_banks.12.bn.running_varâ, âencoder.cbhg.conv1d_banks.13.conv1d.weightâ, âencoder.cbhg.conv1d_banks.13.bn.weightâ, âencoder.cbhg.conv1d_banks.13.bn.biasâ, âencoder.cbhg.conv1d_banks.13.bn.running_meanâ, âencoder.cbhg.conv1d_banks.13.bn.running_varâ, âencoder.cbhg.conv1d_banks.14.conv1d.weightâ, âencoder.cbhg.conv1d_banks.14.bn.weightâ, âencoder.cbhg.conv1d_banks.14.bn.biasâ, âencoder.cbhg.conv1d_banks.14.bn.running_meanâ, âencoder.cbhg.conv1d_banks.14.bn.running_varâ, âencoder.cbhg.conv1d_banks.15.conv1d.weightâ, âencoder.cbhg.conv1d_banks.15.bn.weightâ, âencoder.cbhg.conv1d_banks.15.bn.biasâ, âencoder.cbhg.conv1d_banks.15.bn.running_meanâ, âencoder.cbhg.conv1d_banks.15.bn.running_varâ, âencoder.cbhg.conv1d_projections.0.conv1d.weightâ, âencoder.cbhg.conv1d_projections.0.bn.weightâ, âencoder.cbhg.conv1d_projections.0.bn.biasâ, âencoder.cbhg.conv1d_projections.0.bn.running_meanâ, âencoder.cbhg.conv1d_projections.0.bn.running_varâ, 
âencoder.cbhg.conv1d_projections.1.conv1d.weightâ, âencoder.cbhg.conv1d_projections.1.bn.weightâ, âencoder.cbhg.conv1d_projections.1.bn.biasâ, âencoder.cbhg.conv1d_projections.1.bn.running_meanâ, âencoder.cbhg.conv1d_projections.1.bn.running_varâ, âencoder.cbhg.pre_highway.weightâ, âencoder.cbhg.highways.0.H.weightâ, âencoder.cbhg.highways.0.H.biasâ, âencoder.cbhg.highways.0.T.weightâ, âencoder.cbhg.highways.0.T.biasâ, âencoder.cbhg.highways.1.H.weightâ, âencoder.cbhg.highways.1.H.biasâ, âencoder.cbhg.highways.1.T.weightâ, âencoder.cbhg.highways.1.T.biasâ, âencoder.cbhg.highways.2.H.weightâ, âencoder.cbhg.highways.2.H.biasâ, âencoder.cbhg.highways.2.T.weightâ, âencoder.cbhg.highways.2.T.biasâ, âencoder.cbhg.highways.3.H.weightâ, âencoder.cbhg.highways.3.H.biasâ, âencoder.cbhg.highways.3.T.weightâ, âencoder.cbhg.highways.3.T.biasâ, âencoder.cbhg.gru.weight_ih_l0â, âencoder.cbhg.gru.weight_hh_l0â, âencoder.cbhg.gru.bias_ih_l0â, âencoder.cbhg.gru.bias_hh_l0â, âencoder.cbhg.gru.weight_ih_l0_reverseâ, âencoder.cbhg.gru.weight_hh_l0_reverseâ, âencoder.cbhg.gru.bias_ih_l0_reverseâ, âencoder.cbhg.gru.bias_hh_l0_reverseâ, âdecoder.project_to_decoder_in.weightâ, âdecoder.project_to_decoder_in.biasâ, âdecoder.decoder_rnns.0.weight_ihâ, âdecoder.decoder_rnns.0.weight_hhâ, âdecoder.decoder_rnns.0.bias_ihâ, âdecoder.decoder_rnns.0.bias_hhâ, âdecoder.decoder_rnns.1.weight_ihâ, âdecoder.decoder_rnns.1.weight_hhâ, âdecoder.decoder_rnns.1.bias_ihâ, âdecoder.decoder_rnns.1.bias_hhâ, âdecoder.proj_to_mel.weightâ, âdecoder.proj_to_mel.biasâ, âdecoder.prenet.layers.0.weightâ, âdecoder.prenet.layers.0.biasâ, âdecoder.prenet.layers.1.weightâ, âdecoder.prenet.layers.1.biasâ, âdecoder.attention_rnn.rnn_cell.weight_ihâ, âdecoder.attention_rnn.rnn_cell.weight_hhâ, âdecoder.attention_rnn.rnn_cell.bias_ihâ, âdecoder.attention_rnn.rnn_cell.bias_hhâ, âdecoder.attention_rnn.alignment_model.query_layer.weightâ, âdecoder.attention_rnn.alignment_model.query_layer.biasâ, 
âdecoder.attention_rnn.alignment_model.annot_layer.weightâ, âdecoder.attention_rnn.alignment_model.annot_layer.biasâ, âdecoder.attention_rnn.alignment_model.v.weightâ, âdecoder.stopnet.rnn.weight_ihâ, âdecoder.stopnet.rnn.weight_hhâ, âdecoder.stopnet.rnn.bias_ihâ, âdecoder.stopnet.rnn.bias_hhâ, âdecoder.stopnet.linear.weightâ, âdecoder.stopnet.linear.biasâ, âpostnet.conv1d_banks.0.conv1d.weightâ, âpostnet.conv1d_banks.0.bn.weightâ, âpostnet.conv1d_banks.0.bn.biasâ, âpostnet.conv1d_banks.0.bn.running_meanâ, âpostnet.conv1d_banks.0.bn.running_varâ, âpostnet.conv1d_banks.1.conv1d.weightâ, âpostnet.conv1d_banks.1.bn.weightâ, âpostnet.conv1d_banks.1.bn.biasâ, âpostnet.conv1d_banks.1.bn.running_meanâ, âpostnet.conv1d_banks.1.bn.running_varâ, âpostnet.conv1d_banks.2.conv1d.weightâ, âpostnet.conv1d_banks.2.bn.weightâ, âpostnet.conv1d_banks.2.bn.biasâ, âpostnet.conv1d_banks.2.bn.running_meanâ, âpostnet.conv1d_banks.2.bn.running_varâ, âpostnet.conv1d_banks.3.conv1d.weightâ, âpostnet.conv1d_banks.3.bn.weightâ, âpostnet.conv1d_banks.3.bn.biasâ, âpostnet.conv1d_banks.3.bn.running_meanâ, âpostnet.conv1d_banks.3.bn.running_varâ, âpostnet.conv1d_banks.4.conv1d.weightâ, âpostnet.conv1d_banks.4.bn.weightâ, âpostnet.conv1d_banks.4.bn.biasâ, âpostnet.conv1d_banks.4.bn.running_meanâ, âpostnet.conv1d_banks.4.bn.running_varâ, âpostnet.conv1d_banks.5.conv1d.weightâ, âpostnet.conv1d_banks.5.bn.weightâ, âpostnet.conv1d_banks.5.bn.biasâ, âpostnet.conv1d_banks.5.bn.running_meanâ, âpostnet.conv1d_banks.5.bn.running_varâ, âpostnet.conv1d_banks.6.conv1d.weightâ, âpostnet.conv1d_banks.6.bn.weightâ, âpostnet.conv1d_banks.6.bn.biasâ, âpostnet.conv1d_banks.6.bn.running_meanâ, âpostnet.conv1d_banks.6.bn.running_varâ, âpostnet.conv1d_banks.7.conv1d.weightâ, âpostnet.conv1d_banks.7.bn.weightâ, âpostnet.conv1d_banks.7.bn.biasâ, âpostnet.conv1d_banks.7.bn.running_meanâ, âpostnet.conv1d_banks.7.bn.running_varâ, âpostnet.conv1d_projections.0.conv1d.weightâ, âpostnet.conv1d_projections.0.bn.weightâ, 
âpostnet.conv1d_projections.0.bn.biasâ, âpostnet.conv1d_projections.0.bn.running_meanâ, âpostnet.conv1d_projections.0.bn.running_varâ, âpostnet.conv1d_projections.1.conv1d.weightâ, âpostnet.conv1d_projections.1.bn.weightâ, âpostnet.conv1d_projections.1.bn.biasâ, âpostnet.conv1d_projections.1.bn.running_meanâ, âpostnet.conv1d_projections.1.bn.running_varâ, âpostnet.pre_highway.weightâ, âpostnet.highways.0.H.weightâ, âpostnet.highways.0.H.biasâ, âpostnet.highways.0.T.weightâ, âpostnet.highways.0.T.biasâ, âpostnet.highways.1.H.weightâ, âpostnet.highways.1.H.biasâ, âpostnet.highways.1.T.weightâ, âpostnet.highways.1.T.biasâ, âpostnet.highways.2.H.weightâ, âpostnet.highways.2.H.biasâ, âpostnet.highways.2.T.weightâ, âpostnet.highways.2.T.biasâ, âpostnet.highways.3.H.weightâ, âpostnet.highways.3.H.biasâ, âpostnet.highways.3.T.weightâ, âpostnet.highways.3.T.biasâ, âpostnet.gru.weight_ih_l0â, âpostnet.gru.weight_hh_l0â, âpostnet.gru.bias_ih_l0â, âpostnet.gru.bias_hh_l0â, âpostnet.gru.weight_ih_l0_reverseâ, âpostnet.gru.weight_hh_l0_reverseâ, âpostnet.gru.bias_ih_l0_reverseâ, âpostnet.gru.bias_hh_l0_reverseâ.
size mismatch for embedding.weight: copying a param with shape torch.Size([149, 256]) from checkpoint, the shape in current model is torch.Size([130, 512]).