Skip to content

HTTPS clone URL

Subversion checkout URL

You can clone with HTTPS or Subversion.

Download ZIP
tree: 93b4a6c039
Fetching contributors…

Cannot retrieve contributors at this time

executable file 200 lines (162 sloc) 6.193 kb
#!/usr/bin/perl
# Copyright 2011 Matt Shannon
# Copyright 2001-2008 Nagoya Institute of Technology, Department of Computer Science
# Copyright 2001-2008 Tokyo Institute of Technology, Interdisciplinary Graduate School of Science and Engineering
# This file is part of HTS-demo_CMU-ARCTIC-SLT-STRAIGHT-AR-decision-tree.
# See `License` for details of license and warranty.
# Settings ==============================
$spkr = '@SPEAKER@';
$data = '@DATASET@';
$qnum = '@QNUM@';
$ver = '@VER@';
@SET = ('cmp','dur');
@cmp = ('mgc','lf0','bap');
@dur = ('dur');
$ref{'cmp'} = \@cmp;
$ref{'dur'} = \@dur;
%vflr = ('mgc' => '0.01', # variance floors
'lf0' => '0.01',
'bap' => '0.01',
'dur' => '0.01');
%applyMdl = ('cmp' => '0', # apply MDL?
'dur' => '1');
%thr = ('mgc' => '350.0', # clustering log likelihood threshold
'lf0' => '55.0',
'bap' => '60.0',
'dur' => '0.0');
%mdlf = ('cmp' => '1.0', # tree size control param. for MDL
'dur' => '1.0');
%mocc = ('cmp' => '10.0', # minimum occupancy counts
'dur' => ' 5.0');
%gam = ('cmp' => '000', # stats load threshold
'dur' => '000');
%t2s = ('mgc' => 'cmp', # feature type to mmf conversion
'lf0' => 'cmp',
'bap' => 'cmp',
'dur' => 'dur');
%s2ae = ('cmp' => 'hmm.acc', # set to accumulator file extension
'dur' => 'dur.acc');
%strb = ('mgc' => '1', # stream start
'lf0' => '2',
'bap' => '@BAPSTREN@',
'dur' => '1');
%stre = ('mgc' => '1', # stream end
'lf0' => '@F0STREN@',
'bap' => '@BAPSTREN@',
'dur' => '@NSTATE@');
%msdi = ('mgc' => '0', # msd information
'lf0' => '1',
'bap' => '0',
'dur' => '0');
%strw = ('mgc' => '1.0', # stream weights
'lf0' => '1.0',
'bap' => '1.0',
'dur' => '1.0');
%ordr = ('mgc' => '@MGCVSIZE@', # feature order
'lf0' => '1',
'bap' => '5',
'dur' => '@NSTATE@');
%nwin = ('mgc' => '@NMGCWIN@', # number of windows
'lf0' => '@NLF0WIN@',
'bap' => '@NBAPWIN@',
'dur' => '0');
%nblk = ('mgc' => '@NMGCTRANSBLK@', # number of blocks for transforms
'lf0' => '@NLF0TRANSBLK@',
'bap' => '@NBAPTRANSBLK@',
'dur' => '1');
%band = ('mgc' => '@MGCBANDWIDTH@', # band width for transforms
'lf0' => '@LF0BANDWIDTH@',
'bap' => '@BAPBANDWIDTH@',
'dur' => '0');
#%mdcp = ('dy' => 'd', # model copy
# 'A' => 'a',
# 'I' => 'i',
# 'U' => 'u',
# 'E' => 'e',
# 'O' => 'o');
# Speech Analysis/Synthesis Setting ==============
# speech analysis
$sr = @SAMPFREQ@; # sampling rate (Hz)
$fs = @FRAMESHIFT@; # frame period (point)
$fw = @FREQWARP@; # frequency warping
$gm = @GAMMA@; # pole/zero representation weight
$ul = @MGCLSP@; # use MGC-LSPs instead of MGC coefficients
$lg = @LNGAIN@; # use log gain instead of linear gain
$bs = @BYTESWAP@; # 1: big endian, 0: little endian
$fr = $fs/$sr; # frame period (sec)
# speech synthesis
$pf = @PSTFILTER@; # postfiltering factor
$fl = @IMPLEN@; # length of impulse response
$co = 2047; # order of cepstrum to approximate mel-generalized cepstrum
# Modeling/Generation Setting ==============
# modeling
$nState = @NSTATE@; # number of states
$nIte = @NITER@; # number of iterations for embedded training
$beam = '1500 100 5000'; # initial, inc, and upper limit of beam width
$maxdev = @MAXDEV@; # max standard dev coef to control HSMM maximum duration
$mindur = @MINDUR@; # min state duration to be evaluated
$wf = @WFLOOR@; # mixture weight flooring
# generation
$maxEMiter = @MAXEMITER@; # max EM iteration
$EMepsilon = @EMEPSILON@; # convergence factor for EM iteration
$useGV = @USEGV@; # turn on GV
$maxGViter = @MAXGVITER@; # max GV iteration
$GVepsilon = @GVEPSILON@; # convergence factor for GV iteration
$minEucNorm = @MINEUCNORM@; # minimum Euclid norm for GV iteration
$stepInit = @STEPINIT@; # initial step size
$stepInc = @STEPINC@; # step size acceleration factor
$stepDec = @STEPDEC@; # step size deceleration factor
$hmmWeight = @HMMWEIGHT@; # weight for HMM output prob.
$gvWeight = @GVWEIGHT@; # weight for GV output prob.
$optKind = '@OPTKIND@'; # optimization method (STEEPEST, NEWTON, or LBFGS)
# Directories & Commands ===============
# project directories
$prjdir = '@PWD@';
# HTS commands
$HCOMPV = '@HCOMPV@';
$HINIT = '@HINIT@';
$HREST = '@HREST@';
$HEREST = '@HEREST@';
$HHED = '@HHED@';
$HMGENS = '@HMGENS@';
$ENGINE = '@ENGINE@';
# SPTK commands
$X2X = '@X2X@';
$FREQT = '@FREQT@';
$C2ACR = '@C2ACR@';
$VOPR = '@VOPR@';
$MC2B = '@MC2B@';
$SOPR = '@SOPR@';
$B2MC = '@B2MC@';
$LSP2LPC = '@LSP2LPC@';
$MGC2MGC = '@MGC2MGC@';
$MERGE = '@MERGE@';
$BCP = '@BCP@';
$LSPCHECK = '@LSPCHECK@';
$MGC2SP = '@MGC2SP@';
$INTERPOLATE = '@INTERPOLATE@';
$DFS = '@DFS@';
# SoX (to add RIFF header)
$SOX = '@SOX@';
# MATLAB & STRAIGHT
$MATLAB = '@MATLAB@';
$STRAIGHT = '@STRAIGHT@';
# Switch ================================
$MKEMV = 1; # preparing environments
$HCMPV = 1; # computing a global variance
$IN_RE = 1; # initialization & reestimation
$MMMMF = 1; # making a monophone mmf
$ERST0 = 1; # embedded reestimation (monophone)
$MN2FL = 1; # copying monophone mmf to fullcontext one
$ERST1 = 1; # embedded reestimation (fullcontext)
$CXCL1 = 1; # tree-based context clustering
$ERST2 = 1; # embedded reestimation (clustered)
$UNTIE = 1; # untying the parameter sharing structure
$ERST3 = 1; # embedded reestimation (untied)
$CXCL2 = 1; # tree-based context clustering
$ERST4 = 1; # embedded reestimation (re-clustered)
$MKUN1 = 1; # making unseen models (1mix)
$PGEN1 = 1; # generating speech parameter sequences (1mix)
$WGEN1 = 1; # synthesizing waveforms (1mix)
$LTST1 = 1; # computing log prob on test set (1mix)
1;
Jump to Line
Something went wrong with that request. Please try again.