Advertisement
Guest User

Untitled

a guest
May 30th, 2012
1,334
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 41.54 KB | None | 0 0
  1. <?xml version="1.0"?> <!-- XML version -->
  2. <?xml-stylesheet type="text/xsl" href="SWIrecConfig.xsl"?>
  3.  
  4. <!--
  5.  
  6. ****************************License********************************
  7.  
  8. Copyright (c) 1995-2006 by Nuance Communications, Inc. All rights reserved.
  9.  
  10. Nuance, Inc. provides this document without representation or warranty of
  11. any kind. Nuance, Inc. reserves the right to revise this document and to
  12. change the information contained in this document without further notice.
  13.  
  14. Dialog Modules, OpenSpeech, Productivity Without Boundaries, ScanSoft, the
  15. ScanSoft logo, SMARTRecognizer, SpeechCare, Speechify, SpeechSecure,
  16. SpeechSpot, SpeechSite, SpeechWorks, the SpeechWorks logo, and SpeechWorksHere
  17. are trademarks or registered trademarks of Nuance Communications, Inc. or its
  18. licensors in the United States and/or other countries. This document may also
  19. contain other trademarks, which are the property of their respective owners.
  20.  
  21. Without limiting the rights under copyright reserved above, no part of this
  22. document may be reproduced, stored in or introduced into a retrieval system,
  23. or transmitted in any form or by any means, including, without limitation,
  24. electronic, mechanical, photocopying, recording, or otherwise, without the
  25. prior written permission of Nuance Communications, Inc.
  26.  
  27. -->
  28.  
  29. <!-- Define the structure for the XML -->
  30.  
  31. <!DOCTYPE SWIrecConfig SYSTEM "SWIrecConfig.dtd">
  32.  
  33.  
  34. <!-- *************** Organization of Config Parameters ************* -->
  35.  
  36. <!-- * Parameters related to INITIALIZATION * -->
  37. <!-- * Parameters related to CACHING * -->
  38. <!-- * Parameters related to ENDPOINTER * -->
  39. <!-- * Parameters related to LEARN * -->
  40. <!-- * Parameters related to ACCURACY AND LANGUAGE MODELING * -->
  41. <!-- * Parameters related to PERFORMANCE * -->
  42. <!-- * Parameters related to DEBUGGING * -->
  43. <!-- * NEVER CHANGE WITHOUT Nuance authorization * -->
  44.  
  45.  
  46. <SWIrecConfig version="1.0.0">
  47. <lang name="default">
  48.  
  49.  
  50.  
  51. <!-- ***************************************************************** -->
  52. <!-- * Parameters related to INITIALIZATION * -->
  53. <!-- ***************************************************************** -->
  54.  
  55. <!-- 1:enable speech mode in rec result when NOMATCH; 0:disable this mode -->
  56. <param name="swirec_result_enable_speech_mode">
  57. <value>0</value>
  58. </param>
  59.  
  60. <!-- 0:include "*#ABCD" in DTMF builtin grammars; 1:exclude "*#ABCD" -->
  61. <param name="swirec_builtin_grammar_full_dtmf_mode">
  62. <value>0</value>
  63. </param>
  64.  
  65. <!-- Controls how long the recognizer should wait after the end of
  66. the prompt for the caller to speak. -->
  67. <param name="timeout">
  68. <value>7000</value>
  69. </param>
  70.  
  71. <!-- Controls how much silence (milliseconds) after a successful recognition
  72. is needed to conclude that a caller is finished. -->
  73. <param name="completetimeout">
  74. <value>0</value>
  75. </param>
  76.  
  77. <!-- Controls the level of confidence to determine when the
  78. application needs to confirm. Values 0-1000. -->
  79. <param name="confidencelevel">
  80. <value>0</value>
  81. </param>
  82.  
  83. <!-- Controls the length (milliseconds) of a period of silence after
  84. callers have spoken to conclude that they finished. This timer is
  85. also known as the &quot;after end of speech&quot; timer.
  86. For optimal performance, set this parameter per grammar, as follows:
  87. 500 for short utterances (yes/no, hot word)
  88. 750 for simple queries
  89. 1200 to 2500 for digit strings and long utterances (listings) -->
  90. <param name="incompletetimeout">
  91. <value>2500</value>
  92. </param>
  93.  
  94. <param name="swirec_retain_grammar_import_separator">
  95. <value>0</value>
  96. </param>
  97.  
  98. <param name="swirec_waveform_logging_uniform_name">
  99. <value>0</value>
  100. </param>
  101.  
  102. <!-- Controls sensitivity of the speech detector when
  103. looking for speech. -->
  104. <param name="sensitivity">
  105. <value>0.5</value>
  106. </param>
  107.  
  108. <!-- Controls the trade-off between processing and accuracy. -->
  109. <param name="speedvsaccuracy">
  110. <value>0</value>
  111. </param>
  112.  
  113. <!-- Sets the confidence threshold for recognition results
  114. computed while the selective_barge_in mode is active. -->
  115. <param name="swirec_selective_barge_in_conf_thresh">
  116. <value>700</value>
  117. </param>
  118.  
  119. <!-- Sets the confidence threshold for recognition results
  120. computed while the magic word endpointer mode is active. -->
  121. <param name="swirec_magic_word_conf_thresh">
  122. <value>700</value>
  123. </param>
  124.  
  125. <!-- For Nuance use only. Sets mode of the INTERNAL endpointer. -->
  126. <!-- OSR sets this param as needed for different audio input. -->
  127. <!-- For example, Aurora data requires that the endpointer be disabled. -->
  128. <param name="swirec_internal_endpointer_mode">
  129. <value>end_only</value>
  130. </param>
  131.  
  132. <!-- This parameter is ignored and is reserved for future use. -->
  133. <param name="swirec_audio_environment">
  134. <value>default</value>
  135. </param>
  136.  
  137. <!-- Amount of speech, in milliseconds, that the
  138. recognizer sees before forcing end of speech. -->
  139. <param name="swirec_max_speech_duration">
  140. <value>40000</value>
  141. </param>
  142.  
  143. <!-- Number of entries to return in the nbest list. If &gt;5, additional
  144. CPU cycles will be needed. -->
  145. <param name="swirec_nbest_list_length">
  146. <value>2</value>
  147. </param>
  148.  
  149. <!-- Defines the format of the audio being supplied to the recognizer. -->
  150. <param name="swirec_audio_media_type">
  151. <value>audio/basic;rate=8000</value>
  152. <value>audio/x-alaw-basic;rate=8000</value>
  153. <!-- value&gt;application/x-feature;rate=8000;encoding=speechpearl&lt;/value -->
  154. </param>
  155.  
  156. <!-- Controls whether to log the SWIrslt event -->
  157. <param name="swirec_log_xmlresult">
  158. <value>true</value>
  159. </param>
  160.  
  161. <!-- Add a Nuance grammar key to the XML result. -->
  162. <param name="swirec_extra_nbest_keys">
  163. <value>SWI_meaning</value>
  164. <value>SWI_literal</value>
  165. <value>SWI_grammarName</value>
  166. </param>
  167.  
  168. <!-- Ignore the media type that is returned by the server
  169. upon fetching a grammar. -->
  170. <param name="swirec_ignore_grammar_media_type">
  171. <value>1</value>
  172. </param>
  173.  
  174. <!-- log grammarID in the GRNM token of SWIrcst event -->
  175. <param name="swirec_enable_grammar_id_logging">
  176. <value>0</value>
  177. </param>
  178.  
  179.  
  180. <!-- Max parses evaluated for each literal and grammar
  181. Valid values are 1-99 -->
  182.  
  183. <param name="swirec_max_parses_per_literal">
  184. <value>10</value>
  185. </param>
  186.  
  187. <!-- Set of characters that are allowed in a sampa pronunciation -->
  188.  
  189. <param name="swirec_sampa_characters">
  190. <value>#123459:;=?@ACDEHIJMNOQRSTUVYZ_abdefghijklmnoprstuvwxyz{~</value>
  191. </param>
  192.  
  193. <!-- Max source grammar size (in bytes) that is allowed to be loaded
  194. by the online system or non-sgc tools -->
  195. <param name="swirec_max_source_grammar_size">
  196. <value>-1</value>
  197. </param>
  198.  
  199. <!-- Max training grammar size (in bytes) that is allowed to be loaded
  200. by the online system or non-sgc tools -->
  201. <param name="swirec_max_training_grammar_size">
  202. <value>-1</value>
  203. </param>
  204.  
  205. <!-- For Nuance use only: Set this to 0 to enable support for answer grammars -->
  206. <param name="swirec_suppress_answer_grammar">
  207. <value>1</value>
  208. </param>
  209.  
  210.  
  211.  
  212. <!-- ****************************************************************** -->
  213. <!-- * New License Enforcement initialization parameters * -->
  214. <!-- ****************************************************************** -->
  215.  
  216. <!-- How many osr_swirec licenses will be checked out during SWIrecInit() -->
  217. <param name="swirec_license_ports">
  218. <value>4</value>
  219. </param>
  220.  
  221. <!-- How many osr_swiep licenses will be checked out during SWIepInit() -->
  222. <param name="swiep_license_ports">
  223. <value>4</value>
  224. </param>
  225.  
  226. <!-- Identifies a threshold of licenses, above which usage is considered an overdraft. -->
  227. <param name="swirec_license_ports_overdraft_thresh">
  228. <value>-1</value>
  229. </param>
  230.  
  231. <!-- Identifies a threshold of licenses, above which usage is considered an overdraft. -->
  232. <param name="swiep_license_ports_overdraft_thresh">
  233. <value>-1</value>
  234. </param>
  235.  
  236. <!-- Identifies the features to be checked out by the recognizer -->
  237. <param name="swirec_licensing_features">
  238. <value>osr_nl_u, osr_rec_u, dtmf</value>
  239. </param>
  240.  
  241. <!-- Identifies the features to be checked out by the endpointer -->
  242. <param name="swiep_licensing_features">
  243. <value/>
  244. </param>
  245.  
  246. <!-- Upon detection of a network communication failure with the license server, wait grace
  247. period milliseconds before disabling features; maximum 3600 -->
  248. <param name="swilicense_grace_period">
  249. <value>3600</value>
  250. </param>
  251.  
  252. <!-- ***************************************************************** -->
  253. <!-- * Parameters related to CACHING * -->
  254. <!-- ***************************************************************** -->
  255.  
  256. <!-- Amount of memory the internal cache needs to take up before we
  257. start expiring grammars, in MB -->
  258. <param name="swirec_memory_cache_size">
  259. <value>100</value>
  260. </param>
  261.  
  262. <!-- When maximum cache size is reached, what must the cache size be
  263. reduced to to stop expiring grammars, in MB. Defaults to 85% of
  264. above size -->
  265. <!--
  266. &lt;param name=&quot;swirec_memory_cache_low_water_mark&quot;&gt;
  267. &lt;value&gt;34&lt;/value&gt;
  268. &lt;/param&gt;
  269. -->
  270.  
  271. <!-- Minimum size of compiled grammar to cache in KB -->
  272. <param name="swirec_memory_cache_min_entry_size">
  273. <value>0</value>
  274. </param>
  275.  
  276. <!-- Level to compile newly cached grammars -->
  277. <param name="swirec_default_optimization">
  278. <value>6</value>
  279. </param>
  280.  
  281. <!-- Level to compile often-used grammars -->
  282. <param name="swirec_full_optimization">
  283. <value>9</value>
  284. </param>
  285.  
  286. <!-- Defines &quot;often-used&quot; grammar. It is the number of times
  287. a grammar is accessed from a cache before the
  288. grammar is automatically optimized using the level
  289. in swirec_full_optimization -->
  290. <param name="swirec_hits_before_full_optimize">
  291. <value>3</value>
  292. </param>
  293.  
  294. <!-- User dictionary cache size in MB. The default value is 0 i.e. caching is disabled by default. -->
  295. <param name="swirec_max_dict_cache_size">
  296. <value>0</value>
  297. </param>
  298.  
  299. <!-- Defines whether the disk cache should be used. -->
  300. <param name="swirec_disk_cache_enabled">
  301. <value>1</value>
  302. </param>
  303.  
  304. <!-- Directory name for the disk cache. -->
  305. <!-- If relative, the file path is relative to the containing configuration file. -->
  306. <param name="swirec_disk_cache_directory">
  307. <value>../GrammarCache</value>
  308. </param>
  309.  
  310. <!-- Maximum size of the disk cache in MB -->
  311. <param name="swirec_disk_cache_size">
  312. <value>500</value>
  313. </param>
  314.  
  315. <!-- Minimum size of compiled grammar to cache in KB -->
  316. <param name="swirec_disk_cache_min_entry_size">
  317. <value>0</value>
  318. </param>
  319.  
  320. <!-- When maximum cache size is reached, what must the cache size be
  321. reduced to to stop expiring grammars, in MB. -->
  322. <param name="swirec_disk_cache_low_water_mark">
  323. <value>400</value>
  324. </param>
  325.  
  326. <!-- Address of the HTTP proxy server to use, e.g. 127.0.0.1 -->
  327. <param name="swirec_inet_proxy_server">
  328. <value/>
  329. </param>
  330.  
  331. <!-- Port of the http proxy server to use, e.g. &quot;8080&quot;;
  332. set this only if swirec_inet_proxy_server is set -->
  333. <param name="swirec_inet_proxy_server_port">
  334. <value/>
  335. </param>
  336.  
  337. <!-- Delimiters which are used to separate fields in a grammar
  338. key value query string. The default is &quot;;&amp;&quot;, to allow &quot;x=y;z=d&quot; or
  339. &quot;x=y&amp;z=d&quot; -->
  340. <param name="swirec_inet_query_delimiters">
  341. <value>;&amp;</value>
  342. </param>
  343.  
  344. <!-- Table of translations from grammar language code to internal one -->
  345. <!-- If relative, this file path is relative to baseline (SWISRSDK). -->
  346. <param name="swirec_language_translation_table">
  347. <value>generic/langtable.text</value>
  348. </param>
  349.  
  350.  
  351. <!-- ***************************************************************** -->
  352. <!-- * Parameters related to ENDPOINTER * -->
  353. <!-- ***************************************************************** -->
  354.  
  355. <!-- This parameter is ignored and is reserved for future use. -->
  356. <param name="swiep_audio_environment">
  357. <value>default</value>
  358. </param>
  359.  
  360. <!-- Backoff is a safety margin to ensure the begin-of-speech is captured.
  361. The margin extends the BOS marker slightly (milliseconds) sooner in
  362. the audio sample. -->
  363. <param name="swiep_BOS_backoff">
  364. <value>200</value>
  365. </param>
  366.  
  367. <!-- Backoff is a safety margin to ensure the end-of-speech is captured.
  368. The margin extends the EOS marker slightly (milliseconds) later in
  369. the audio sample. -->
  370. <param name="swiep_EOS_backoff">
  371. <value>240</value>
  372. </param>
  373.  
  374. <!-- Inform the speech detector about the audio format being
  375. supplied to the recognizer. -->
  376. <param name="swiep_audio_media_type">
  377. <value>audio/basic;rate=8000</value>
  378. <value>audio/x-alaw-basic;rate=8000</value>
  379. </param>
  380.  
  381. <!-- Controls how loudly the caller must speak to interrupt
  382. prompts (barge-in) in order for speech to be detected. -->
  383. <param name="swiep_in_prompt_sensitivity_percent">
  384. <value>50</value>
  385. </param>
  386.  
  387. <!-- Turns barge-in on/off. If a dialog state is not using barge-in, then set this parameter to 0.
  388. The input received by the endpointer differs depending on whether barge-in is enabled or not.
  389. When barge-in is enabled, the ratio of silence to speech sent to the endpointer increases
  390. considerably; also, the sound that follows the first recognition call is usually the residual
  391. prompt or background noise. When barge-in is not enabled, the first sound processed is usually
  392. the caller's speech. Setting this parameter ensures that the endpointer is optimized
  393. for either condition.
  394. -->
  395. <param name="bargein">
  396. <value>1</value>
  397. </param>
  398.  
  399. <!-- Sets the speech detector into various endpointer modes. -->
  400. <param name="swiep_mode">
  401. <value>begin_only</value>
  402. </param>
  403.  
  404. <!-- Must be set if SWIepRead is used by platform -->
  405. <param name="swiep_use_swiep_read">
  406. <value>1</value>
  407. </param>
  408.  
  409. <!-- Disable pre-endpointed waveform logging entirely. -->
  410. <param name="swiep_suppress_waveform_logging">
  411. <value>1</value>
  412. </param>
  413.  
  414. <!-- Disable logging of endpointer events. -->
  415. <param name="swiep_suppress_event_logging">
  416. <value>0</value>
  417. </param>
  418.  
  419. <!-- Max channels to simultaneously save pre-endpointed waveforms. -->
  420. <param name="swiep_waveform_logging_max_channels">
  421. <value>-1</value>
  422. </param>
  423.  
  424. <!-- Timeout (seconds) for inactive channel when max_channels
  425. is set -->
  426. <param name="swiep_waveform_logging_channel_timeout">
  427. <value>300</value>
  428. </param>
  429.  
  430. <!-- Prevent thrashing on tiny input buffers, each of which
  431. has a constant fixed cost. Too big hurts response time;
  432. too small increases cpu; 800 recommended for 8khz ulaw
  433. legal values 1 to 1999 -->
  434. <param name="swiep_min_bytes_to_process">
  435. <value>800</value>
  436. </param>
  437.  
  438. <!-- Controls how much memory is spent holding samples waiting for read
  439. to catch up to write; in msecs -->
  440. <param name="swiep_max_read_lag">
  441. <value>10000</value>
  442. </param>
  443.  
  444. <!-- suppresses barge-in for this many msecs; can stop early barge-ins -->
  445. <param name="swiep_suppress_barge_in_time">
  446. <value>0</value>
  447. </param>
  448.  
  449. <!-- ***************************************************************** -->
  450. <!-- * Advanced endpointer configuration -->
  451. <!-- * In general, you should not need to adjust these parameters; the -->
  452. <!--* endpointer is optimized to provide the best performance with -->
  453. <!--* default settings. Nuance will continue to revamp these settings -->
  454. <!--* based on field results. -->
  455. <!-- ***************************************************************** -->
  456.  
  457. <!-- ** Start of the call
  458. Nuance provides parameters that allow the endpointer to reject speech-like residual
  459. echoes, which are typically strongest at the start of the call. ** -->
  460.  
  461. <!-- This parameter specifies the speech level (on a dBm scale) of the most quiet utterance
  462. that can trigger the endpointer at the start of the first recognition. This parameter keeps
  463. the endpointer from being triggered by prompt echoes at the beginning of the first recognition,
  464. before the echo cancellation might have converged. This minimum level gradually decreases to
  465. the value specified by swiep_bargein_min_noise_floor according to the timing values specified by
  466. swiep_bargein_initial_hold_seconds and swiep_bargein_initial_decay_seconds. This parameter is used only
  467. when bargein is set to 1. -->
  468. <param name="swiep_bargein_initial_noise_floor">
  469. <value>-25</value>
  470. </param>
  471.  
  472. <!-- This parameter specifies how long (in seconds) the initial noise floor set by
  473. swiep_bargein_initial_noise_floor is held. After this time, the initial noise floor starts
  474. to transition to the value specified in swiep_bargein_min_noise_floor. The transition lasts for the
  475. duration specified in swiep_bargein_initial_decay_seconds. This parameter is used only when bargein
  476. is set to 1. -->
  477. <param name="swiep_bargein_initial_hold_seconds">
  478. <value>1.5</value>
  479. </param>
  480.  
  481. <!-- This parameter specifies the duration (in seconds) during which the minimum noise floor transitions
  482. from the value specified in swiep_bargein_initial_noise_floor to the value specified in
  483. swiep_bargein_min_noise_floor. This parameter is used only when bargein is set to 1. -->
  484. <param name="swiep_bargein_initial_decay_seconds">
  485. <value>0.5</value>
  486. </param>
  487.  
  488. <!-- This parameter specifies whether to automatically truncate the initial hold time when
  489. the endpointer is notified that the prompt has completed -->
  490. <param name="swiep_stop_initial_hold_on_prompt_done">
  491. <value>1</value>
  492. </param>
  493.  
  494. <!-- This parameter specifies the absolute minimum level of speech (on a dBm scale) that can trigger
  495. the endpointer. This parameter is always used, regardless of the value in parameter bargein. -->
  496. <param name="swiep_bargein_min_noise_floor">
  497. <value>-45</value>
  498. </param>
  499.  
  500. <!-- Detection sensitivity
  501. generalized sensitivity settings are offered through 'sensitivity' and 'swiep_in_prompt_sensitivity_percent'.
  502. Sensitivity can be fine-tuned through adjustment of parameters in this section. -->
  503.  
  504. <!-- Set this parameter to 0 to disable 'sensitivity' and 'swiep_in_prompt_sensitivity_percent'
  505. before tuning the remaining parameters in this section.
  506. -->
  507. <param name="swiep_use_sensitivity">
  508. <value>1</value>
  509. </param>
  510.  
  511. <!-- This parameter is the primary parameter controlling the sensitivity of the endpointer.
  512. Increasing it requires a larger change in energy to trigger the endpointer, and decreasing
  513. it makes the endpointer more sensitive. -->
  514. <param name="swiep_threshold_snr">
  515. <value>14</value>
  516. </param>
  517.  
  518. <!-- The value of this parameter is added to the threshold specified by parameter
  519. swiep_threshold_snr to detect the first start-of-speech in a call. A larger positive
  520. number increases the detection threshold for the first utterance. After one successful
  521. recognition, this parameter is ignored. This parameter does not apply to the detection of
  522. end-of-speech -->
  523. <param name="swiep_threshold_snr_first_offset">
  524. <value>3</value>
  525. </param>
  526.  
  527. <!-- The value of this parameter is applied to the threshold specified by parameter
  528. swiep_threshold_snr to detect the end-of-speech. A larger negative number makes it
  529. more likely that phrases ending weakly are classified as speech. -->
  530. <param name="swiep_threshold_snr_end_offset">
  531. <value>-3</value>
  532. </param>
  533.  
  534. <!-- The value of this parameter specifies the search range for a smart back-up that
  535. looks for low-energy consonants (msec) -->
  536. <param name="swiep_consonant_search_width">
  537. <value>550</value>
  538. </param>
  539.  
  540. <!-- The value of this parameter specifies the difference between the measured phrase strength
  541. and the minimum strength required to trigger the endpointer, that may represent a consonant. -->
  542. <param name="swiep_consonant_offset">
  543. <value>3</value>
  544. </param>
  545.  
  546. <!-- ** Timing
  547. This section describes new and updated timing parameters used to determine the
  548. begin-of-speech and end-of-speech. ** -->
  549.  
  550. <!-- To trigger the start-of-speech, a certain percentage of frames
  551. (specified by swiep_start_percentage) during a time window
  552. (specified by swiep_start_seconds) must be above the threshold specified by
  553. swiep_threshold_snr. The default values mean that the duration of speech activity required
  554. to determine that speech has started is about 0.045 seconds. -->
  555. <param name="swiep_start_percentage">
  556. <value>0.15</value>
  557. </param>
  558. <param name="swiep_start_seconds">
  559. <value>0.3</value>
  560. </param>
  561.  
  562. <!-- To trigger the end-of-speech, a certain percentage of frames (specified by swiep_end_percentage)
  563. during a time window (specified by incompletetimeout) must be below the detection thresholds. -->
  564. <param name="swiep_end_percentage">
  565. <value>1.0</value>
  566. </param>
  567.  
  568. <!-- ** Adapting speech models
  569. The endpointer keeps an adapting speech model of the signal level for the current caller.
  570. To trigger the endpointer, the current signal must be reasonably close to or above the adapting
  571. speech model. This section describes the parameters that control the adapting speech models.** -->
  572.  
  573. <!-- If the spectral estimate of the input signal is lower than the speech model of the speaker, it
  574. has to be within the threshold specified by this parameter to trigger the endpointer. For example, if
  575. the speech model of the speaker is 46 and parameter swiep_voice_threshold is set to 5, the input signal
  576. must be 41 or higher to trigger the endpointer. Increasing this value (typically to 10) will let more
  577. quiet utterances and weak onsets trigger the endpointer when the speech model for the current caller
  578. is loud. -->
  579. <param name="swiep_voice_threshold">
  580. <value>5</value>
  581. </param>
  582.  
  583. <!-- This parameter provides an initial estimate (on a dBm scale) of how loud the speaker will be.
  584. This is used by the endpointer when comparing the current level of the signal to an internally-adapting
  585. model of the speech frames that have been processed so far. Increasing this parameter can lead to fewer
  586. false triggers, and decreasing it can lead to fewer misses. This parameter is independent of the
  587. swiep_threshold_snr and noise floor-related parameters. -->
  588. <param name="swiep_initial_voice_bin">
  589. <value>-35</value>
  590. </param>
  591.  
  592. <!-- For Nuance use only. -->
  593. <param name="swiep_dbg_verbosity">
  594. <value>0</value>
  595. </param>
  596.  
  597. <!-- ***************************************************************** -->
  598. <!-- * Parameters related to HOT INSERT and Grammar Preloading-->
  599. <!-- ***************************************************************** -->
  600.  
  601. <!--Number of seconds between attempts to update baseline data -->
  602. <param name="swirec_update_interval">
  603. <value>600</value>
  604. </param>
  605.  
  606. <!-- If this file exists, hot insert will NOT be done, use this to
  607. temporarily stop hot insert while a group of files is updated. -->
  608. <param name="swirec_update_lockfile">
  609. <value>lockfile.dat</value>
  610. </param>
  611.  
  612. <!-- If this is set, preloaded grammars will never be removed from
  613. the cache, even if they normally would expire or SWIrecGrammarFree() is called -->
  614. <param name="swirec_lock_preload_grammars">
  615. <value>0</value>
  616. </param>
  617.  
  618. <!-- Set default properties used for SWIrecGrammarLoad,Activate,Free(), See
  619. Properties (VXIinet) in Reference Manual for configurable properties -->
  620. <param name="swirec_default_loadfree_properties">
  621. <value/>
  622. <!-- Example:
  623. <value>swirec_mem_flush_on_free=1</value>
  624. <value>inet.maxage=0</value>
  625. -->
  626. </param>
  627.  
  628.  
  629. <param name="swirec_preload_file">
  630. <value>SWIgrmPreload.xml</value>
  631. </param>
  632.  
  633. <!-- ***************************************************************** -->
  634. <!-- * Parameters related to LEARN * -->
  635. <!-- ***************************************************************** -->
  636.  
  637. <!-- For Nuance use only. -->
  638. <param name="swirec_learn_timeout">
  639. <value/>
  640. </param>
  641.  
  642. <!-- For Nuance use only. -->
  643. <param name="swirec_learn_server">
  644. <value/>
  645. </param>
  646.  
  647. <!-- ***************************************************************** -->
  648. <!-- * Parameters related to ACCURACY AND LANGUAGE MODELING * -->
  649. <!-- ***************************************************************** -->
  650.  
  651. <!-- For Nuance use only. Sets a maximum number of models (e.g. male/female).
  652. Typically never changed. -->
  653. <param name="swirec_num_parallel_models">
  654. <value>2</value>
  655. </param>
  656.  
  657. <!-- Language model scale. Scale used to get language model within same
  658. dynamic range as acoustic models. -->
  659. <param name="swirec_lmweight">
  660. <value>1.0</value>
  661. </param>
  662.  
  663. <!-- For Nuance use only: Weight of lm during rescore phase. Absolute value (not dependent on lmweight). -->
  664. <param name="swirec_lmrescore_weight">
  665. <value>2.0</value>
  666. </param>
  667.  
  668. <!-- For Nuance use only -->
  669. <param name="swirec_max_arc_cost">
  670. <value>6.5</value>
  671. </param>
  672.  
  673. <!-- For Nuance use only -->
  674. <param name="swirec_max_epsilon_arc_cost">
  675. <value>6.0</value>
  676. </param>
  677.  
  678. <!-- ***************************************************************** -->
  679. <!-- * SSM defaults * -->
  680. <!-- ***************************************************************** -->
  681.  
  682. <!-- If confidence of ssm is below this number, do not return result.
  683. Range:0.0-1.0 -->
  684. <param name="swissm_confidence_threshold">
  685. <value>0.0</value>
  686. </param>
  687.  
  688.  
  689. <!-- ***************************************************************** -->
  690. <!-- * Word level confidence parameters * -->
  691. <!-- ***************************************************************** -->
  692.  
  693. <!-- Enables/disables word-level confidence estimates -->
  694. <param name="swirec_word_confidence_enabled">
  695. <value>0</value>
  696. </param>
  697.  
  698. <!-- Word posterior pruning. Controls the density of the word lattice
  699. by pruning all word hypotheses with an initial posterior estimate
  700. larger than this value. Also relates to the amount of CPU spent
  701. computing the word lattice and ultimately the word level confidence
  702. estimates -->
  703. <param name="swirec_word_posterior_pruning">
  704. <value>7.0</value>
  705. </param>
  706.  
  707. <!-- Controls the density of the lattice used for computing word consensus
  708. hypothesis. Need to keep this value relatively low to minimize CPU -->
  709. <param name="swirec_word_lattice_density">
  710. <value>100.0</value>
  711. </param>
  712.  
  713. <!-- ***************************************************************** -->
  714. <!-- * Slot level confidence parameters * -->
  715. <!-- ***************************************************************** -->
  716.  
  717. <!-- Used to calculate SP sentence confidence -->
  718. <param name="swirec_slot_confidence_norm_factor">
  719. <value>1.0</value>
  720. </param>
  721.  
  722. <!-- Interpolation factor to combine OSR and SP slot confidence values -->
  723. <param name="swirec_combined_slot_confidence_factor">
  724. <value>1.0</value>
  725. </param>
  726.  
  727. <!-- ***************************************************************** -->
  728. <!-- * Parameters related to PERFORMANCE * -->
  729. <!-- ***************************************************************** -->
  730.  
  731. <!-- Speed vs Accuracy tradeoff. Valid settings are idle, normal, busy, pegged and on.
  732. Other parameters that use one of several values based on the setting of this
  733. parameter will choose their value in the order above (idle=first_value, normal=
  734. second_value, busy=third_value, and pegged=fourth_value).
  735. &quot;On&quot; means the load_adjusted speed vs accuracy is dynamic. -->
  736. <param name="swirec_load_adjusted_speedvsaccuracy">
  737. <value>on</value>
  738. </param>
  739.  
  740. <!-- Maximum number of dictionary pronunciations to use per word. -->
  741. <param name="swirec_max_dict_prons">
  742. <value>8</value>
  743. </param>
  744.  
  745. <!-- Maximum number of automatically generated pronunciations per word. -->
  746. <param name="swirec_max_auto_prons">
  747. <value>1</value>
  748. </param>
  749.  
  750. <!-- For Nuance use only. Controls the second pass re-scoring stage.
  751. It will only execute on N-best entries from the first pass that are
  752. within the specified delta from each other. Concept: if the first pass
  753. gives a big delta, you can be fairly confident that the second
  754. N-best is not the correct answer, and a second pass re-score
  755. will probably not force it to the top either. Higher numbers
  756. can increase accuracy, but will slow response time. -->
  757. <param name="swirec_max_rescore_delta">
  758. <value>500</value>
  759. <value>500</value>
  760. <value>500</value>
  761. <value>500</value>
  762. </param>
  763.  
  764. <!-- For Nuance use only. Related to the second pass re-scoring stage.
  765. Controls the absolute time spent for rescoring. -->
  766. <param name="swirec_max_rescore_time">
  767. <value>20000</value>
  768. <value>20000</value>
  769. <value>20000</value>
  770. <value>20000</value>
  771. </param>
  772.  
  773. <!-- The maximum amount of time that the recognizer spends
  774. to recognize an answer. Milliseconds. -->
  775. <param name="swirec_max_cpu_time">
  776. <value>20000</value>
  777. </param>
  778.  
  779. <!-- The maximum time of the search phase of recognition. Milliseconds. -->
  780. <param name="swirec_max_search_time">
  781. <value>5000</value>
  782. </param>
  783.  
  784. <!-- Defines an approximate usage percentage as &quot;normal&quot; CPU load.
  785. When usage is normal, the recognizer can dynamically use more CPU
  786. to improve accuracy. -->
  787. <param name="swirec_normal_cpu_start">
  788. <value>15</value>
  789. </param>
  790.  
  791. <!-- Defines an approximate usage percentage as &quot;busy&quot; CPU load.
  792. When usage is busy, the recognizer does not use extra CPU
  793. to refine its results. -->
  794. <param name="swirec_busy_cpu_start">
  795. <value>40</value>
  796. </param>
  797.  
  798. <!-- Defines an approximate usage percentage as &quot;pegged&quot; (maximum) CPU load.
  799. When usage is pegged, the recognizer minimizes CPU usage. -->
  800. <param name="swirec_pegged_cpu_start">
  801. <value>101</value>
  802. </param>
  803.  
  804. <!-- The maximum number of candidates to consider when attempting
  805. to fill the nbest list. This is not the preferred way to control
  806. nbest processing and should only be set small when there is a specific
  807. reason each sentence is very expensive (like a computationally intense
  808. ECMAscript). Otherwise accuracy and confidence can be seriously impaired
  809. for no reason. By default (value of 99999999) this parameter has no effect.
  810. This parameter can also be set via SetParameter or a &lt;meta&gt; in a grammar. -->
  811. <param name="swirec_max_sentences_tried">
  812. <value>999999</value>
  813. </param>
  814.  
  815. <!-- This is the main search parameter guiding the Viterbi beam search.
  816. It is used to prune all active paths. These are paths either active
  817. during Hmm state propagation or paths active during FSM state propagation. -->
  818. <param name="swirec_state_beam">
  819. <value>0</value>
  820. <value>-15</value>
  821. <value>-45</value>
  822. <value>-45</value>
  823. </param>
  824.  
  825. <!-- This is equivalent to the above state_beam, but for the parallel
  826. decoding of the GSM only. -->
  827. <param name="swirec_gsm_state_beam">
  828. <value>-50</value>
  829. </param>
  830.  
  831. <!-- This determines the vocab threshold that decides whether we use the full or small
  832. gsm. However, we always use the small gsm in busy -->
  833. <param name="swirec_gsm_vocab_size_threshold">
  834. <value>100</value>
  835. </param>
  836.  
  837. <!-- Determines how much the phoneme look-ahead influences the Viterbi beam search.
  838. Typically this parameter is set to match the beam search parameter.
  839. Conceivably a better trade-off can be achieved by using a tighter beam
  840. for the phoneme look-ahead compared to the main Viterbi beam. -->
  841. <param name="swirec_phoneme_lookahead_beam">
  842. <value>-30</value>
  843. <value>-45</value>
  844. <value>-60</value>
  845. <value>-60</value>
  846. </param>
  847.  
  848. <!-- Determines how much to reduce the state beam when the current best path
  849. ends in a silence model. This effectively reduces the search space by
  850. tighter pruning when the search is confident of being in a silence region. -->
  851. <param name="swirec_silence_prune_offset">
  852. <value>56</value>
  853. <value>56</value>
  854. <value>56</value>
  855. <value>56</value>
  856. </param>
  857.  
  858. <!-- Maximum number of FSM arcs that can be active at any time. This parameter
  859. is used to guide the histogram pruning algorithm that dynamically adjusts
  860. the state beam to ensure the total number of active arcs does not
  861. exceed swirec_max_arcs. -->
  862. <param name="swirec_max_arcs">
  863. <value>10000</value>
  864. <value>6000</value>
  865. <value>3000</value>
  866. <value>3000</value>
  867. </param>
  868.  
  869. <!-- For Nuance use only. The word beam applies only at word endings. The
  870. hypothesis is that search paths at end of words can be pruned tighter than
  871. other paths, without loss of accuracy. -->
  872. <param name="swirec_word_beam">
  873. <value>-50</value>
  874. </param>
  875.  
  876. <!-- For Nuance use only. Penalty for self loop transitions in the Hmm model -->
  877. <param name="swirec_loop_penalty">
  878. <value>0.3</value>
  879. </param>
  880.  
  881. <!-- For Nuance use only. Penalty for next state transition in Hmm model. -->
  882. <param name="swirec_next_penalty">
  883. <value>0.2</value>
  884. </param>
  885.  
  886. <!-- For Nuance use only. Penalty to skip a Hmm state. -->
  887. <param name="swirec_skip_penalty">
  888. <value>0.6</value>
  889. </param>
  890.  
  891. <!-- For Nuance use only. Penalty for entering silence model. -->
  892. <param name="swirec_pause_penalty">
  893. <value>0.6</value>
  894. </param>
  895.  
  896. <!-- For Nuance use only. Self loop penalty for the Hmm silence state. -->
  897. <param name="swirec_silence_penalty">
  898. <value>0.0</value>
  899. </param>
  900.  
  901. <!-- For Nuance use only. Penalty for entering a whole word unit model. -->
  902. <param name="swirec_whole_word_unit_penalty">
  903. <value>2.0</value>
  904. </param>
  905.  
  906. <!-- For Nuance use only. Word transition penalty. -->
  907. <param name="swirec_word_penalty">
  908. <value>1.0</value>
  909. </param>
  910.  
  911. <!-- For Nuance use only. Start-of-sentence cost. -->
  912. <param name="swirec_sentence_initial_cost">
  913. <value>1.0</value>
  914. </param>
  915.  
  916. <!-- For Nuance use only. Forward search forces a
  917. model restart if this number of frames have passed -->
  918. <param name="swirec_restart_neighborhood">
  919. <value>25</value>
  920. </param>
  921.  
  922. <!-- For Nuance use only. Generate lattice states for
  923. one frame over two; a value of 0 turns this off -->
  924. <param name="swirec_lattice_decimation">
  925. <value>0</value>
  926. </param>
  927.  
  928. <!-- For Nuance use only: Phonetic Pruning activation -->
  929. <param name="swirec_ppr_active">
  930. <value>1</value>
  931. </param>
  932.  
  933. <!-- For Nuance use only.
  934. threshold of phone posterior to prune start arc -->
  935. <param name="swirec_ppr_start_thres">
  936. <value>0.00001</value>
  937. </param>
  938.  
  939. <!-- For Nuance use only.
  940. threshold of phone posterior to prune existing arc -->
  941. <param name="swirec_ppr_exist_thres">
  942. <value>0.0</value>
  943. </param>
  944.  
  945. <!-- For Nuance use only.
  946. maximum threshold of phone posterior to prune arc after correction
  947. based on position in the beam -->
  948. <param name="swirec_ppr_max_thres">
  949. <value>0.01</value>
  950. </param>
  951.  
  952. <!-- For Nuance use only.
  953. Scaling factor used to correct the ppr threshold -->
  954. <param name="swirec_ppr_thres_scale_factor">
  955. <value>170.667</value>
  956. </param>
  957.  
  958.  
  959. <!-- For Nuance use only. Whether to share contents of public rules referenced by other public
  960. rules. Turning on speeds grammar compilation and lowers compiled memory
  961. size but results in recognition-time CPU increase. -->
  962. <param name="swirec_shared_publics">
  963. <value>0</value>
  964. </param>
  965.  
  966. <!-- For Nuance use only. Max number of nodes that can be visited during the astar search
  967. before it is aborted -->
  968. <param name="swirec_astar_max_paths">
  969. <value>100000</value>
  970. </param>
  971.  
  972. <!-- Turning on causes an implicit-root (of all grammar publics) to
  973. be defined if an explicit root rule is not declared in the grammar.
  974. Note that this behavior does not seem to be compatible with
  975. the relevant w3c specifications. -->
  976. <param name="swirec_compute_implicit_root">
  977. <value>0</value>
  978. </param>
  979.  
  980. <!-- ***************************************************************** -->
  981. <!-- * Parameters related to DEBUGGING * -->
  982. <!-- ***************************************************************** -->
  983.  
  984. <!-- Maximum n-best entries logged in event log. -->
  985. <param name="swirec_max_logged_nbest">
  986. <value>2</value>
  987. </param>
  988.  
  989. <!-- For Nuance use only. Turns on/off the writing of a computation statistics
  990. file. These statistics show the amounts of time spent during various
  991. recognition steps. -->
  992. <param name="swirec_save_comp_stats">
  993. <value>0</value>
  994. </param>
  995.  
  996. <!-- Disable post-endpointed waveform logging entirely. -->
  997. <param name="swirec_suppress_waveform_logging">
  998. <value>0</value>
  999. </param>
  1000.  
  1001. <!-- Disable logging of recognition events. -->
  1002. <param name="swirec_suppress_event_logging">
  1003. <value>0</value>
  1004. </param>
  1005.  
  1006. <!-- Current recognition should be treated as sensitive information
  1007. and thus suppressed according to suppression rules. -->
  1008. <param name="secure_context">
  1009. <value>0</value>
  1010. </param>
  1011.  
  1012. <!-- Suppress sensitive information from URI according to suppression
  1013. rules. Not settable at runtime. Defaults to '0' (do not suppress) -->
  1014. <param name="secure_context_uri">
  1015. <value>0</value>
  1016. </param>
  1017.  
  1018. <!-- Max channels to simultaneously save waveforms. -->
  1019. <param name="swirec_waveform_logging_max_channels">
  1020. <value>-1</value>
  1021. </param>
  1022.  
  1023. <!-- Timeout (seconds) for inactive channel when max_channels
  1024. is set. Specifies the number of seconds during which a rec
  1025. handle must be idle in order to be considered inactive and
  1026. therefore not logging any waveforms -->
  1027. <param name="swirec_waveform_logging_channel_timeout">
  1028. <value>300</value>
  1029. </param>
  1030.  
  1031. <!-- Allows/disallows obtaining waveforms by calling SWIrecGetWaveform() -->
  1032. <param name="swirec_return_waveform">
  1033. <value>1</value>
  1034. </param>
  1035.  
  1036. <!-- Length of leading silence (msecs) in returned waveform
  1037. when calling SWIrecGetWaveformEx with 'begin' silence_suppression -->
  1038. <param name="swirec_waveform_begin_silence">
  1039. <value>0</value>
  1040. </param>
  1041.  
  1042. <!-- Length of trailing silence (msecs) in returned waveform
  1043. when calling SWIrecGetWaveformEx with 'end' silence_suppression -->
  1044. <param name="swirec_waveform_end_silence">
  1045. <value>0</value>
  1046. </param>
  1047.  
  1048. <!-- Maximum length of interword silence (msecs) in returned waveform
  1049. when calling SWIrecGetWaveformEx with 'interword' silence_suppression -->
  1050. <param name="swirec_waveform_interword_max">
  1051. <value>0</value>
  1052. </param>
  1053.  
  1054. <!-- Percentage of the maximum waveform amplitude to be used
  1055. as threshold for detecting speech -->
  1056. <param name="swirec_waveform_speech_thresh">
  1057. <value>10.0</value>
  1058. </param>
  1059.  
  1060. <!-- Safety margin (msecs) extending the BOS and EOS in the waveform -->
  1061. <param name="swirec_waveform_speech_backoff">
  1062. <value>50</value>
  1063. </param>
  1064.  
  1065. <!-- ***************************************************************** -->
  1066. <!-- * NEVER CHANGE WITHOUT Nuance authorization * -->
  1067. <!-- ***************************************************************** -->
  1068.  
  1069. <!-- For Nuance use only. -->
  1070. <!-- Wait if completetimeout is gt incompletetimeout -->
  1071. <param name="swirec_allow_wait_completetimeout">
  1072. <value>0</value>
  1073. </param>
  1074.  
  1075. <!-- For Nuance use only. -->
  1076. <!-- If relative, this file path is relative to baseline (SWISRSDK). -->
  1077. <param name="swifeature_config_name">
  1078. <value>generic/models/feature.txt</value>
  1079. </param>
  1080.  
  1081. <!-- For Nuance use only. -->
  1082. <!-- File containing data related to confidence and rejection. -->
  1083. <param name="swirec_reject_info_name">
  1084. <value>generic/models/reject.text</value>
  1085. </param>
  1086.  
  1087. <!-- For Nuance use only. Sets up path to OSR language-specific configuration files. -->
  1088. <!-- If relative, this file path is relative to baseline (SWISRSDK). -->
  1089. <param name="swirec_language_baseline">
  1090. <value>@LANGUAGENAME@/@[email protected]</value>
  1091. </param>
  1092.  
  1093. <param name="swirec_rp_info_name">
  1094. <value>generic/rp_info.txt</value>
  1095. </param>
  1096.  
  1097. <param name="swirec_fixed_score_delta_conf">
  1098. <value>0</value>
  1099. </param>
  1100.  
  1101. </lang>
  1102.  
  1103. </SWIrecConfig>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement