---
# config.yaml
#
# Selects three components (`frontend`, `model`, `encoder`) and gives each a
# matching `<name>_conf` mapping holding that component's settings.
#
# NOTE(review): this file was recovered from a rendered listing in which every
# line carried an "N. " gutter prefix and all indentation had been flattened.
# The nesting below (keys that follow a bare `*_conf:` belong to that mapping
# until the next top-level key) is a reconstruction; confirm it against the
# consumer's schema.

# Front-end component and its settings.
frontend: WavFrontendOnline
frontend_conf:
  fs: 16000
  window: hamming
  n_mels: 80
  frame_length: 25
  frame_shift: 10
  dither: 0.0
  lfr_m: 5
  lfr_n: 1

# Model component and its settings.
model: FsmnVADStreaming
model_conf:
  # Same value as frontend_conf.fs; presumably the two must agree (verify).
  sample_rate: 16000
  detect_mode: 1
  snr_mode: 0
  max_end_silence_time: 800
  max_start_silence_time: 3000
  # Booleans are written in canonical lowercase form.
  do_start_point_detection: true
  do_end_point_detection: true
  window_size_ms: 200
  sil_to_speech_time_thres: 150
  speech_to_sil_time_thres: 150
  speech_2_noise_ratio: 1.0
  # NOTE(review): an integer here, while the other `do_*` flags are booleans.
  # Left unchanged; confirm the consumer expects an int.
  do_extend: 1
  lookback_time_start_point: 200
  lookahead_time_end_point: 100
  max_single_segment_time: 60000
  snr_thres: -100.0
  noise_frame_num_used_for_snr: 100
  decibel_thres: -100.0
  speech_noise_thres: 0.6
  fe_prior_thres: 0.0001
  # silence_pdf_num is 1 and sil_pdf_ids has one entry; presumably the count
  # must match the list length (verify).
  silence_pdf_num: 1
  sil_pdf_ids: [0]
  speech_noise_thresh_low: -0.1
  speech_noise_thresh_high: 0.3
  output_frame_probs: false
  # These two carry the same values as frontend_conf.frame_shift (10) and
  # frontend_conf.frame_length (25); presumably they must stay in sync (verify).
  frame_in_ms: 10
  frame_length_ms: 25

# Encoder component and its settings.
encoder: FSMN
encoder_conf:
  # 400 equals frontend_conf.n_mels (80) * frontend_conf.lfr_m (5); presumably
  # derived from them (verify before changing either side).
  input_dim: 400
  input_affine_dim: 140
  fsmn_layers: 4
  linear_dim: 250
  proj_dim: 128
  lorder: 20
  rorder: 0
  lstride: 1
  rstride: 0
  output_affine_dim: 140
  output_dim: 248