voxforge.org
VoxForge Dev

root/Trunk/Scripts/AcousticModel_scripts/HTK/manual_testing/Copy of julian.jconf

Revision 887, 10.8 kB (checked in by kmaclean, 2 years ago)

8kHz:16bit Acoustic Model build

Line 
1 # Copyright (c) 1991-2005 Kawahara Lab., Kyoto University
2 # Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology
3 # Copyright (c) 2005      Julius project team, Nagoya Institute of Technology
4 # All rights reserved
5 #
6 # Example of Runtime Configuration File for Julian rev.3.5
7 #
8 # 1) NOTICE: relative paths must be relative to THIS FILE.
9 #            The current working directory has no effect on them.
10 # 2) Blank lines and comments after '#' are ignored.
11 #    Use `\#' to specify `#' in an argument.
12 # 3) Each line should be shorter than 512 bytes.
13 # 4) The syntax of each argument is the same as the corresponding command option.
14 # 5) The commented-out values in this file are default values in Julian.
15 #
16
17 ######################################################################
18 #### Files
19 ######################################################################
20 ##
21 ## Grammar definition file (DFA and dictionary)
22 ##
23
24 #### There are three ways to specify the grammar files.
25 #### (1) and (2) can be used multiple times.
26
27 #### (1) Specify by common prefix of .dfa and .dict files. Comma-separated
28 #### prefixes can be specified for multiple grammar recognition
29 #-gram /cdrom/testrun/sample_grammars/vfr/vfr
30
31 #### (2) Or you can give Julian a text file which contains list of grammar
32 #### prefixes one per line.
33 #-gramlist file
34
35 #### (3) Classic way to specify a grammar.
36 -dfa sample.dfa
37 -v sample.dict
38
39 #### If you want to clear previously specified grammars, use this at the
40 #### point.
41 #-nogram
42
43 ##
44 ## Acoustic HMM file
45 ##
46 # support ascii hmmdefs or binary format (converted by "mkbinhmm")
47 # format (ascii/binary) will be automatically detected
48 -h ../acoustic_model_files/hmmdefs
49
50 ## triphone model needs HMMList that maps logical triphone to physical ones.
51 -hlist ../acoustic_model_files/tiedlist
52
53 ######################################################################
54 #### Multiple grammar recognition
55 ######################################################################
56 #-multigramout          # Output results for each grammar
57
58 ######################################################################
59 #### Language Model
60 ######################################################################
61 ##
62 ## word insertion penalty
63 ##
64 #-penalty1 0.0          # first pass
65 #-penalty2 0.0          # second pass
66
67 ######################################################################
68 #### Dictionary
69 ######################################################################
70 ##
71 ## do not give up startup on error words
72 ##
73 #-forcedict
74
75 ######################################################################
76 #### Acoustic Model
77 ######################################################################
78 ##
79 ## Context-dependency handling will be enabled according to the model type.
80 ## Try below if julius wrongly detects the type of hmmdefs
81 ##
82 #-no_ccd                # disable context-dependency handling
83 #-force_ccd             # enable context-dependency handling
84
85 ##
86 ## If julius goes wrong when checking the parameter type, try below.
87 ##
88 #-notypecheck
89 #
90
91 ##
92 ## (PTM/triphone) switch computation method of IWCD on 1st pass
93 ##
94 #-iwcd1 best N  # assign average of N-best likelihood of the same context
95 #-iwcd1 max     # assign maximum likelihood of the same context
96 #-iwcd1 avg     # assign average likelihood of the same context (default)
97
98 ######################################################################
99 #### Gaussian Pruning
100 ######################################################################
101 ## Number of mixtures to select in a mixture pdf.
102 ## This default value is optimized for IPA99's PTM,
103 ## with 64 Gaussians per codebook
104 #-tmix 2
105
106 ## Select Gaussian pruning algorithm
107 ## default: beam (standard setting), safe (others)
108 #-gprune safe           # safe pruning, accurate but slow
109 #-gprune heuristic      # heuristic pruning
110 #-gprune beam           # beam pruning, fast but sensitive
111 #-gprune none           # no pruning
112
113 ######################################################################
114 #### Gaussian Mixture Selection
115 ######################################################################
116 #-gshmm hmmdefs         # monophone HMM for GMS
117                         # (OFF when not specified)
118 #-gsnum 24              # number of states to be selected on GMS
119
120 ######################################################################
121 #### Search Parameters
122 ######################################################################
123 #-b 400                 # beam width on 1st pass (#nodes) for monophone
124 #-b 800                 # beam width on 1st pass (#nodes) for triphone,PTM
125 #-b 1000                # beam width on 1st pass (#nodes) for triphone,PTM,engine=v2.1
126 #-b2 30                 # beam width on 2nd pass (#words)
127 #-sb 80.0               # score beam envelope threshold
128 #-s 500                 # hypotheses stack size on 2nd pass (#hypo)
129 #-m 2000                # hypotheses overflow threshold (#hypo)
130 #-lookuprange 5         # lookup range for word expansion (#frame)
131 #-n 1                   # num of sentences to find (#sentence)
132 #-n 10                  #   (default for 'standard' configuration)
133 #-output 1              # num of found sentences to output (#sentence)
134 #-looktrellis           # search within only backtrellis words
135
136 ######################################################################
137 #### Inter-word Short Pause Handling
138 ######################################################################
139 ##
140 ## Specify short pause model name to be treated as special
141 ##
142 #-spmodel "sp"          # HMM model name
143
144 ##
145 ## For insertion of context-free short-term inter-word pauses between words
146 ##  (multi-path version only)
147 ##
148 #-iwsp                  # append a skippable sp model at all word ends
149 #-iwsppenalty 0.0       # transition penalty for the appended sp models
150
151 ######################################################################
152 #### Speech Input Source
153 ######################################################################
154 ## select one (default: mfcfile)
155 #-input mfcfile         # MFCC file in HTK parameter file format
156 #-input rawfile         # raw wavefile (auto-detect format)
157                         # WAV(16bit) or
158                         # RAW(16bit(signed short),mono,big-endian)
159                         # AIFF,AU (with libsndfile extension)
160                         # other than 16kHz, sampling rate should be specified
161                         # by "-smpFreq" option
162 #-input mic             # direct microphone input
163                         # device name can be specified via env. var. "AUDIODEV"
164 #-input netaudio -NA host:0    # direct input from DatLink(NetAudio) host
165 #-input adinnet -adport portnum # via adinnet network client
166 #-input stdin           # from standard tty input (pipe)
167
168 #-filelist filename     # specify file list to be recognized in batch mode
169
170 #-nostrip               # switch OFF dropping of invalid input segment.
171                         # (default: strip off invalid segments (0 sequence etc.))
172 #-zmean                 # enable DC offset removal (invalid for mfcfile input)
173
174 ######################################################################
175 #### Recording
176 ######################################################################
177 #-record directory      # auto-save recognized speech data into the dir
178
179 ######################################################################
180 #### GMM-based Input Verification and Rejection
181 ######################################################################
182 #-gmm gmmdefs           # specify GMM definition file in HTK format
183 #-gmmnum 10             # num of Gaussians to be computed per mixture
184 #-gmmreject "noise,laugh,cough" # list of GMM names to be rejected
185
186 ######################################################################
187 #### Too Short Input Rejection
188 ######################################################################
189 #-rejectshort 800       # reject input shorter than specified millisecond
190
191 ######################################################################
192 #### Speech Detection
193 ######################################################################
194 #-pausesegment          # turn on speech detection by level and zero-cross
195 #-nopausesegment        # turn off speech detection by level and zero-cross
196                         # (default: on for mic or adinnet, off for file)
197 #-lv 2000               # threshold of input level (0-32767)
198 #-headmargin 300        # head margin of input segment (msec)
199 #-tailmargin 400        # tail margin of input segment (msec)
200 #-zc 60                 # threshold of number of zero-cross in a second
201
202 ######################################################################
203 #### Acoustic Analysis
204 ######################################################################
205 -smpFreq 8000           # sampling rate (Hz)
206 #-smpPeriod 625         # sampling period (100ns units) (= 10000000 / smpFreq)
207 #-fsize 400             # window size (samples)
208 #-fshift 160            # frame shift (samples)
209 #-delwin 2              # delta window (frames)
210 #-hifreq -1             # cut-off hi frequency (Hz) (-1: disable)
211 #-lofreq -1             # cut-off low frequency (Hz) (-1: disable)
212 #-cmnsave filename      # save CMN param to file (update per input)
213 #-cmnload filename      # load initial CMN param from file on startup
214
215 ######################################################################
216 #### Spectral Subtraction (SS)
217 ######################################################################
218 #-sscalc                # do SS using head silence (file input only)
219 #-sscalclen 300         # length of head silence for SS (msec)
220 #-ssload filename       # load constant noise spectrum from file for SS
221 #-ssalpha 2.0           # alpha coef. for SS
222 #-ssfloor 0.5           # spectral floor for SS
223
224 ######################################################################
225 #### Forced alignment
226 ######################################################################
227 #-walign                # do forced alignment with result per word
228 #-palign                # do forced alignment with result per phoneme
229 #-salign                # do forced alignment with result per HMM state
230
231 ######################################################################
232 #### Word Confidence Scoring
233 ######################################################################
234 #-cmalpha 0.05          # smoothing coef. alpha
235
236 ######################################################################
237 #### Output
238 ######################################################################
239 #-separatescore         # output language and acoustic score separately
240 #-progout               # output partial result per time interval
241 #-proginterval 300      # time interval for "-progout" (msec)
242 #-quiet                 # output minimal result
243 #-demo                  # = "-progout -quiet", suitable for dictation demo
244 #-debug                 # output full message for debug
245 #-charconv from to      # output character set conversion (see manual for
246                         # available code set name)
247
248 ######################################################################
249 #### Server module mode
250 ######################################################################
251 #-module                # Run Julius in "Server module mode"
252 #-module 5530           # (when using another port number for connection)
253 #-outcode WLPSC         # select output message toward module (WLPSCwlps)
254
255 ######################################################################
256 #### Misc.
257 ######################################################################
258 #-help                  # output help and exit
259 #-setting               # output engine configuration and exit
260 #-C jconffile           # expand other jconf file in its place
261
262 ################################################################# end of file
Note: See TracBrowser for help on using the browser.