Home | History | Annotate | Download | only in en.us
      1 # This is the telematics grammar test; the grammar is fixed.
      2 # default models
      3 cmdline.modelfiles	     = models/generic11_f.swimdl models/generic11_m.swimdl
      4 cmdline.arbfile	     = models/generic.swiarb
      5 cmdline.tcp          = CMDLINE.TCPFILE
      6 cmdline.lda		= models/generic11.lda
      7 #
      8 cmdline.modelfiles11       = models/generic11_f.swimdl models/generic11_m.swimdl
      9 cmdline.modelfiles8       = models/generic8_f.swimdl models/generic8_m.swimdl
     10 cmdline.lda11		= models/generic11.lda
     11 cmdline.lda8		= models/generic8.lda
     12 #
     13 cmdline.vocabulary	= dictionary/cmu6plus.ok.zip
     14 #cmdline.vocabulary	= dictionary/large.ok
     15 #
     16 cmdline.datapath     = \\silicon2\D\\visteon_en_us\\train\\wave
     17 cmdline.results	     = recog4.res;
     18 cmdline.use_image	= 2;
     19 cmdline.detail_res	 = YES;
     20 cmdline.bgsniff      = 25;
     21 
     22 # beginning-of-speech (BOS) detection settings
     23 cmdline.bgsniff_min     = 4;
     24 # 1 = yes, perform start-pointing
     25 cmdline.gatedmode    = 1;
     26 
     27 # level-based end-of-speech (EOS) detection settings
     28 cmdline.silence_duration_in_frames = 100;
     29 cmdline.end_of_utterance_hold_off_in_frames = 30;
     30 
     31 # logging
     32 cmdline.DataCaptureDirectory = logs
     33 # OSI Log levels (bit set indicates level is ON)
     34 # 0 no logging
     35 # BIT 0 -> BASIC logging
     36 # BIT 1 -> AUDIO waveform logging
     37 # BIT 2 -> ADD WORD logging
     38 # e.g. a value of 3 (bits 0 and 1 set) enables BASIC + AUDIO logging, without ADD WORD logging
     39 SREC.Recognizer.osi_log_level = 0
     40 SREC.Recognizer.utterance_timeout = 400
     41 
     42 CREC.ParVersion         	= 1.0 ;
     43 CREC.useCREClogger = 1;
     44 
     45 CREC.Acoustic.dimen     	= 36 ;
     46 CREC.Acoustic.skip      	= 5 ;
     47 CREC.Acoustic.stay      	= 5 ;
     48 CREC.Acoustic.durscale  	= 5 ;
     49 CREC.Acoustic.minvar    	= 2860 ;
     50 CREC.Acoustic.maxvar    	= 2860 ;
     51 CREC.Acoustic.frame_period = 20 ;
     52 CREC.Acoustic.load_models	= non_generic;
     53 
     54 CREC.Frontend.mel_dim             = 12 ;
     55 CREC.Frontend.samplerate          = 11025 ;
     56 CREC.Frontend.premel              = 0.9 ;
     57 CREC.Frontend.lowcut              = 125 ;
     58 CREC.Frontend.highcut             = 5500 ;
     59 CREC.Frontend.window_factor       = 2 ;
     60 CREC.Frontend.offset		  = 0 ;
     61 CREC.Frontend.ddmel               = YES ;
     62 CREC.Frontend.peakdecayup         = 0.3 ;
     63 CREC.Frontend.peakdecaydown       = 0.7 ;
     64 CREC.Frontend.do_skip_even_frames = YES ;
     65 CREC.Frontend.melA 	= 14 45 60 70 95 115 115 135 135 155 160 180 ;
     66 CREC.Frontend.melB	= 42 110 105 110 140 140 150 120 150 130 140 130 ;
     67 CREC.Frontend.dmelA	= 50 150 290 320 400 500 500 600 600 700 720 750 ;
     68 CREC.Frontend.dmelB	= 127 127 127 127 127 127 127 127 127 127 127 127 ;
     69 CREC.Frontend.ddmelA 	= 4 12 22 27 32 35 35 45 45 55 57 62 ;
     70 CREC.Frontend.ddmelB	= 127 127 127 127 127 127 127 127 127 127 127 127 ;
     71 # BOS detection
     72 CREC.Frontend.speech_detect	  = 14 ;
     73 CREC.Frontend.ambient_within	  = 7 ;
     74 CREC.Frontend.speech_above	  = 18 ;
     75 CREC.Frontend.start_windback      = 50 ;
     76 CREC.Frontend.utterance_allowance = 40 ;
     77 
     78 CREC.Frontend.swicms.forget_factor = 400 ;
     79 CREC.Frontend.swicms.sbindex       = 100 ;
     80 CREC.Frontend.swicms.inutt.forget_factor2 = 40 ;
     81 CREC.Frontend.swicms.inutt.disable_after = 200;
     82 CREC.Frontend.swicms.inutt.enable_after = 10;
     83 
     84 CREC.Pattern.dimen              = 28 ;
     85 CREC.Pattern.mix_score_scale    =  0.46 ;
     86 CREC.Pattern.imelda_scale	= 14 ;
     87 
     88 # grammar-based end-of-speech (EOS) detection parameters
     89 CREC.Recognizer.max_frames = 1000;
     90 CREC.Recognizer.eou_threshold     = 120 ;
     91 CREC.Recognizer.terminal_timeout  = 30 ;
     92 CREC.Recognizer.optional_terminal_timeout = 45 ;
     93 CREC.Recognizer.non_terminal_timeout     = 90 ;
     94 
     95 # for the recognition search
     96 CREC.Recognizer.max_fsm_arcs           = 25000;
     97 CREC.Recognizer.max_fsm_nodes          = 14500;
     98 
     99 CREC.Recognizer.max_hmm_tokens         = 400
    100 CREC.Recognizer.max_word_tokens        = 2000;
    101 CREC.Recognizer.max_altword_tokens     = 400;
    102 CREC.Recognizer.max_fsmnode_tokens     = 400
    103 CREC.Recognizer.viterbi_prune_thresh   = 400
    104 CREC.Recognizer.num_wordends_per_frame = 10
    105 CREC.Recognizer.max_model_states       = 3600
    106 ## C:/users/dahan/esr/baseline/bin/srectestD.exe -parfile ./expr_large.par -grammar recog_nm/namesnnumsSC_dyn,addWords=1000 
    107 
    108 SREC.Confidence.sigmoid_param.gdiff.one_nbest    =  0.003    -3.15  0.05
    109 SREC.Confidence.sigmoid_param.gdiff.many_nbest   =  0.001    -2.21  0.2105
    110 SREC.Confidence.sigmoid_param.sd.one_nbest       =  0.0       0.0   0.0
    111 SREC.Confidence.sigmoid_param.sd.many_nbest      = -0.0161    0.9   0.0526
    112 SREC.Confidence.sigmoid_param.sd13.one_nbest     =  0.0       0.0   0.0 
    113 SREC.Confidence.sigmoid_param.sd13.many_nbest    = -0.0141    1.5   0.0526
    114 SREC.Confidence.sigmoid_param.spf.one_nbest      = -0.002     0.4   0.05
    115 SREC.Confidence.sigmoid_param.spf.many_nbest     =  0.02     -8.63  0.3157
    116 SREC.Confidence.sigmoid_param.abs.one_nbest      =  0.0001   -4.5   0.05
    117 SREC.Confidence.sigmoid_param.abs.many_nbest     =  0.000031 -1.67  0.0526
    118 SREC.Confidence.sigmoid_param.gdiffpf.one_nbest  =  0.33     -5.5   0.85
    119 SREC.Confidence.sigmoid_param.gdiffpf.many_nbest =  0.24     -3.59  0.3157
    120 
    121 # for G2P module
    122 G2P.Available   = YES
    123 G2P.Data        = g2p/en-US-ttp.data
    124