---
# config.yaml
#
# Model / encoder / tokenizer configuration.
#
# NOTE(review): this file was reconstructed from a flattened listing in which
# the original indentation was lost. Nesting under each bare `*_conf:` key is
# inferred from key order; in particular, `punc_list`, `punc_weight` and
# `sentence_end_id` are assumed to belong to `model_conf` -- confirm against
# the consumer's schema.

model: CTTransformer
model_conf:
  ignore_id: 0
  embed_unit: 256
  att_unit: 256
  dropout_rate: 0.1
  # Symbol-only entries are quoted so no parser can mistake them for YAML
  # syntax; the parsed string values are unchanged.
  punc_list:
    - '<unk>'
    - '_'
    - ','
    - '。'
    - '?'
    - '、'
  # Six weights, matching the six entries of punc_list.
  punc_weight:
    - 1.0
    - 1.0
    - 1.0
    - 1.0
    - 1.0
    - 1.0
  # Presumably a 0-based index into punc_list (index 3 is '。') -- TODO confirm.
  sentence_end_id: 3

encoder: SANMEncoder
encoder_conf:
  input_size: 256
  output_size: 256
  attention_heads: 8
  linear_units: 1024
  num_blocks: 4
  dropout_rate: 0.1
  positional_dropout_rate: 0.1
  attention_dropout_rate: 0.0
  input_layer: pe
  pos_enc_class: SinusoidalPositionEncoder
  normalize_before: true
  kernel_size: 11
  # NOTE(review): key spelling ("shfit") is kept exactly as found; the
  # consumer presumably looks it up under this name -- do not "correct" it
  # without checking the code that reads this file.
  sanm_shfit: 0
  selfattention_layer_type: sanm
  padding_idx: 0

tokenizer: CharTokenizer
tokenizer_conf:
  unk_symbol: '<unk>'