"""Data parameters (``params_data.py``).

Plain module-level constants grouped into four sections: mel-filterbank,
audio, voice activity detection (VAD) and audio volume normalization.
"""

## Mel-filterbank
mel_window_length = 25  # In milliseconds
mel_window_step = 10  # In milliseconds
mel_n_channels = 40


## Audio
sampling_rate = 16000
# Number of spectrogram frames in a partial utterance
partials_n_frames = 160  # 1600 ms (160 frames x 10 ms mel_window_step)
# Number of spectrogram frames at inference
inference_n_frames = 80  # 800 ms (80 frames x 10 ms mel_window_step)


## Voice Activity Detection (VAD)
# Window size of the VAD. Must be either 10, 20 or 30 milliseconds.
# This sets the granularity of the VAD. Should not need to be changed.
vad_window_length = 30  # In milliseconds
# Number of frames to average together when performing the moving average
# smoothing. The larger this value, the larger the VAD variations must be to
# not get smoothed out.
vad_moving_average_width = 8
# Maximum number of consecutive silent frames a segment can have.
vad_max_silence_length = 6


## Audio volume normalization
audio_norm_target_dBFS = -30