Computation of the spectrogram and mel-filter bank (fbank) features.
See ./scripts/sptk/compute_{spectrogram,fbank}.py -h
-
Spectrogram
```bash
# 257-dim log spectrogram
echo "egs asset/egs.wav" | ../../scripts/sptk/compute_spectrogram.py \
  --frame-len 400 \
  --frame-hop 256 \
  --round-power-of-two true \
  --center true \
  --apply-log true \
  - feats.ark
# visualize and check
../../scripts/sptk/visualize_tf_matrix.py \
  --input ark --cmap jet --frame-hop 256 \
  feats.ark
```
-
Fbank
```bash
# 80-dim log fbank
echo "egs asset/egs.wav" | ../../scripts/sptk/compute_fbank.py \
  --frame-len 400 \
  --frame-hop 256 \
  --round-power-of-two true \
  --center true \
  --apply-log true \
  --num-bins 80 \
  - feats.ark
# visualize and check
../../scripts/sptk/visualize_tf_matrix.py \
  --input ark --cmap jet --frame-hop 256 \
  feats.ark
```