mirror of
https://github.com/FunAudioLLM/CosyVoice.git
synced 2026-02-05 01:49:25 +08:00
Merge pull request #323 from FunAudioLLM/hengwu.zty/zh_example
change dropout_rate to float type
This commit is contained in:
@@ -31,7 +31,7 @@ llm: !new:cosyvoice.llm.llm.TransformerLM
|
|||||||
num_blocks: 3
|
num_blocks: 3
|
||||||
dropout_rate: 0.1
|
dropout_rate: 0.1
|
||||||
positional_dropout_rate: 0.1
|
positional_dropout_rate: 0.1
|
||||||
attention_dropout_rate: 0
|
attention_dropout_rate: 0.0
|
||||||
normalize_before: True
|
normalize_before: True
|
||||||
input_layer: 'linear'
|
input_layer: 'linear'
|
||||||
pos_enc_layer_type: 'rel_pos_espnet'
|
pos_enc_layer_type: 'rel_pos_espnet'
|
||||||
@@ -49,7 +49,7 @@ llm: !new:cosyvoice.llm.llm.TransformerLM
|
|||||||
num_blocks: 7
|
num_blocks: 7
|
||||||
dropout_rate: 0.1
|
dropout_rate: 0.1
|
||||||
positional_dropout_rate: 0.1
|
positional_dropout_rate: 0.1
|
||||||
attention_dropout_rate: 0
|
attention_dropout_rate: 0.0
|
||||||
input_layer: 'linear_legacy'
|
input_layer: 'linear_legacy'
|
||||||
pos_enc_layer_type: 'rel_pos_espnet'
|
pos_enc_layer_type: 'rel_pos_espnet'
|
||||||
selfattention_layer_type: 'rel_selfattn'
|
selfattention_layer_type: 'rel_selfattn'
|
||||||
@@ -97,7 +97,7 @@ flow: !new:cosyvoice.flow.flow.MaskedDiffWithXvec
|
|||||||
in_channels: 320
|
in_channels: 320
|
||||||
out_channels: 80
|
out_channels: 80
|
||||||
channels: [256, 256]
|
channels: [256, 256]
|
||||||
dropout: 0
|
dropout: 0.0
|
||||||
attention_head_dim: 64
|
attention_head_dim: 64
|
||||||
n_blocks: 4
|
n_blocks: 4
|
||||||
num_mid_blocks: 8
|
num_mid_blocks: 8
|
||||||
|
|||||||
@@ -31,7 +31,7 @@ llm: !new:cosyvoice.llm.llm.TransformerLM
|
|||||||
num_blocks: 6
|
num_blocks: 6
|
||||||
dropout_rate: 0.1
|
dropout_rate: 0.1
|
||||||
positional_dropout_rate: 0.1
|
positional_dropout_rate: 0.1
|
||||||
attention_dropout_rate: 0
|
attention_dropout_rate: 0.0
|
||||||
normalize_before: True
|
normalize_before: True
|
||||||
input_layer: 'linear'
|
input_layer: 'linear'
|
||||||
pos_enc_layer_type: 'rel_pos_espnet'
|
pos_enc_layer_type: 'rel_pos_espnet'
|
||||||
@@ -49,7 +49,7 @@ llm: !new:cosyvoice.llm.llm.TransformerLM
|
|||||||
num_blocks: 14
|
num_blocks: 14
|
||||||
dropout_rate: 0.1
|
dropout_rate: 0.1
|
||||||
positional_dropout_rate: 0.1
|
positional_dropout_rate: 0.1
|
||||||
attention_dropout_rate: 0
|
attention_dropout_rate: 0.0
|
||||||
input_layer: 'linear_legacy'
|
input_layer: 'linear_legacy'
|
||||||
pos_enc_layer_type: 'rel_pos_espnet'
|
pos_enc_layer_type: 'rel_pos_espnet'
|
||||||
selfattention_layer_type: 'rel_selfattn'
|
selfattention_layer_type: 'rel_selfattn'
|
||||||
@@ -97,7 +97,7 @@ flow: !new:cosyvoice.flow.flow.MaskedDiffWithXvec
|
|||||||
in_channels: 320
|
in_channels: 320
|
||||||
out_channels: 80
|
out_channels: 80
|
||||||
channels: [256, 256]
|
channels: [256, 256]
|
||||||
dropout: 0
|
dropout: 0.0
|
||||||
attention_head_dim: 64
|
attention_head_dim: 64
|
||||||
n_blocks: 4
|
n_blocks: 4
|
||||||
num_mid_blocks: 12
|
num_mid_blocks: 12
|
||||||
|
|||||||
Reference in New Issue
Block a user