{
  "architectures": [
    "FastSpeech2ConformerModel"
  ],
  "decoder_config": {
    "attention_dropout_rate": 0.2,
    "concat_after": false,
    "dropout_rate": 0.2,
    "kernel_size": 31,
    "layers": 4,
    "linear_units": 1536,
    "normalize_before": false,
    "num_attention_heads": 2,
    "positional_dropout_rate": 0.2
  },
  "duration_predictor_channels": 256,
  "duration_predictor_dropout_rate": 0.2,
  "duration_predictor_kernel_size": 3,
  "duration_predictor_layers": 2,
  "encoder_config": {
    "attention_dropout_rate": 0.2,
    "concat_after": false,
    "dropout_rate": 0.2,
    "kernel_size": 7,
    "layers": 4,
    "linear_units": 1536,
    "normalize_before": false,
    "num_attention_heads": 2,
    "positional_dropout_rate": 0.2
  },
  "encoder_layers": 4,
  "encoder_num_attention_heads": 2,
  "energy_embed_dropout": 0.0,
  "energy_embed_kernel_size": 1,
  "energy_predictor_channels": 256,
  "energy_predictor_dropout": 0.5,
  "energy_predictor_kernel_size": 3,
  "energy_predictor_layers": 2,
  "hidden_size": 384,
  "input_dim": 78,
  "is_encoder_decoder": true,
  "max_source_positions": 5000,
  "model_type": "fastspeech2_conformer",
  "num_languages": null,
  "num_mel_bins": 80,
  "num_speakers": null,
  "pitch_embed_dropout": 0.0,
  "pitch_embed_kernel_size": 1,
  "pitch_predictor_channels": 256,
  "pitch_predictor_dropout": 0.5,
  "pitch_predictor_kernel_size": 5,
  "pitch_predictor_layers": 5,
  "positionwise_conv_kernel_size": 3,
  "reduction_factor": 1,
  "speaker_embed_dim": null,
  "speaking_speed": 1.0,
  "speech_decoder_postnet_dropout": 0.5,
  "speech_decoder_postnet_kernel": 5,
  "speech_decoder_postnet_layers": 5,
  "speech_decoder_postnet_units": 256,
  "stop_gradient_from_energy_predictor": false,
  "stop_gradient_from_pitch_predictor": true,
  "torch_dtype": "float32",
  "transformers_version": "4.33.0.dev0",
  "use_cnn_in_conformer": true,
  "use_macaron_style_in_conformer": true,
  "use_masking": true,
  "use_weighted_masking": false,
  "vocab_size": 78
}