From sumomo @ users.sourceforge.jp Thu Oct 2 17:21:57 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:21:57 +0900 Subject: [Julius-cvs 271] CVS update: julius4/man Message-ID: <1222935717.476031.30552.nullmailer@users.sourceforge.jp> From sumomo @ users.sourceforge.jp Thu Oct 2 17:22:04 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:22:04 +0900 Subject: [Julius-cvs 272] CVS update: julius4/man/ja Message-ID: <1222935724.049239.31404.nullmailer@users.sourceforge.jp> From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:45 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:45 +0900 Subject: [Julius-cvs 273] CVS update: julius4/adinrec Message-ID: <1222935825.381077.32204.nullmailer@users.sourceforge.jp> Index: julius4/adinrec/00readme-ja.txt diff -u julius4/adinrec/00readme-ja.txt:1.2 julius4/adinrec/00readme-ja.txt:1.3 --- julius4/adinrec/00readme-ja.txt:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adinrec/00readme-ja.txt Thu Oct 2 17:23:45 2008 @@ -1,68 +1,130 @@ + adinrec + ADINREC(1) ADINREC(1) -NAME - adinrec - record one sentence utterance to a file +?? + adinrec + - ????????????????????? -SYNOPSIS - adinrec [options..] filename +?? + adinrec [options...] {filename} DESCRIPTION - adinrec ? ????????????????t???????????? - ?? - - ?????????????????????ョ? 16bit monoral ?????- ????f???ョ? WAV ???????????????????????- ?????D - - ????????? "-" ????????o???????D????f?? - ?ョ?RAW?????? + adinrec ??????????????????????????????? + ???????????C???????????????????f??? + ?????????????????-input ?????? ???????? + ????????????????????? + + ????????????????????????ョ? 16bit, 1 channel + ??????o????????ョ? Microsoft WAV ?ョ???? ???? + ?????????????????????D - ? ?????????C???????????????????????? - ???????? + ?????? "-" ???????????????????o????? + ??????f???ョ? RAW ?ョ???? OPTIONS - -freq threshold - ????????????? 
Hz (default: 16000) - - -lv threslevel - ????????????? (0 - 32767)?(default: 2000)? - - -zc zerocrossnum - ??????????????? (default: 60) - - -margin msec - ??????????????O???? ? ?? ? ? ? ? ? ? - (default: 300) - - -nostrip - ? ?? 0 ?????ゥ????s???????????????ゥ - ????s?? - - -zmean DC?????s?? - - -raw RAW???????????s???ョ? 16bit, big endian ???? + Julius ????????????????????????????? ?? + ???????????????????????adinrec ?ゥ? ????? + ????? Julius ?????????????? + + adinrec specific options + -freq Hz + ???????????? (Hz) ??????(default: 16,000) + + -raw + RAW?????ョ?????D + + Concerning Julius options + -input {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} + ?????????????????????????file??? + ?rawfile?? ?????????????????????????? + ??? ????????adinnet ??? adintool ?????????? + ??????? ???????????????????????? + netaudio ?DatLink??????? stdin????????????s?? + esd??????????????????? Linux?????????? + ??????? EsounD daemon ??????? + + -lv thres + ????????????? 0 ?? 32767 ????????? (default: + 2000) + + -zc thres + ??????????????????????????? (default: 60) + + -headmargin msec + ???????????????????? (default: 300) + + -tailmargin msec + ????????}??????????? (default: 400) + + -zmean + ????????????????????s???????????? + ?????????D + + -smpFreq Hz + ???????????? (Hz) ??????(default: 16,000) + + -48 + 48kHz???????16kHz????????????? ??? 16kHz ?? + ??????????????????? ?????????????? + ? sptk ?? ?????? (Rev. 4.0) + + -NA devicename + DatLink ????????? (-input netaudio). + + -adport port_number + + -input adinnet ???????????? adinnet ?????????? + ??(default: 5530) + + -nostrip + ??????????????????????????????? ? + "0" ??????????????????Julius ???C?? ???? + ?????????????????D??????????????? + ????C???????????????ゥ???????????? + ???? + + -C jconffile + jconf?????????????????????????W????? + + -plugindir dirlist + ????????????????????????????????? + ??????????? + +ENVIRONMENT VARIABLES + ALSADEV + (?????? alsa ???????) ????????????? ??? + ?????"default"? + + AUDIODEV + (?????? 
oss ???????) ????????????? ??? + ?????"/dev/dsp"? + + LATENCY_MSEC + Linux (alsa/oss) ??? Windows ??????????????? ?? + ????????????????????????????????CPU + ????????????????????????OS? ??????? + ?????????????OS ????????? ?????????? + ???????????? SEE ALSO - adintool(1), julius(1), sox(1), wavplay(1), wavrec(1), aplay(1), - arecord(1) - -BUGS - ?????????????????? julius @ lavender.ics.nitech.ac.jp? - ???????? + julius ( 1 ) , + adintool ( 1 ) COPYRIGHT - Copyright (c) 1991-2006 ???? ????コ - Copyright (c) 2000-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2006 ??????? Julius????? + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL ADINREC(1) + 10/02/2008 ADINREC(1) Index: julius4/adinrec/00readme.txt diff -u julius4/adinrec/00readme.txt:1.2 julius4/adinrec/00readme.txt:1.3 --- julius4/adinrec/00readme.txt:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adinrec/00readme.txt Thu Oct 2 17:23:45 2008 @@ -1,62 +1,130 @@ + adinrec + ADINREC(1) ADINREC(1) NAME - adinrec - record one sentence utterance to a file + adinrec + - record audio device and save one utterance to a file SYNOPSIS - adinrec [options..] filename + adinrec [options...] {filename} DESCRIPTION - adinrec records one spoken utterance from microphone to a file. + adinrec opens an audio stream, detects an utterance input and store it + to a specified file. The utterance detection is done by level and + zero-cross thresholds. Default input device is microphone, but other + audio input source, including Julius A/D-in plugin, can be used by + using "-input" option. - Output format is WAV, 16bit, monoral, no compression. If the file - already exist, it will be overridden. If filename of "-" is specified, - recorded data will be output to stdout. 
+ The audio format is 16 bit, 1 channel, in Microsoft WAV format. If the + given filename already exists, it will be overridden. - The sensitiveness of speech detection can be controlled by thresholds - of zerocross number and power (level). + If filename is "-" , the captured data will be streamed into standard + out, with no header (raw format). OPTIONS - -freq threshold - Sampling frequency (Hz, default=16000) - - -lv threslevel - Level threshold (0-32767, default=2000) - - -zc zerocrossnum - Zero cross number threshold in a second (default=60) - - -margin msec - Record margin before/after the detected segment (milliseconds, - default=300) - - -nostrip - Disable skipping of invalid zero samples (default: enabled) + adinrec uses JuliusLib and adopts Julius options. Below is a list of + valid options. - -zmean Enable zero mean subtraction to remove DC offset. - - -raw RAW format output (default: WAV) + adinrec specific options + -freq Hz + Set sampling rate in Hz. (default: 16,000) + + -raw + Output in raw file format. + + JuliusLib options + -input {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} + Choose speech input source. Specify 'file' or 'rawfile' for waveform + file. On file input, users will be prompted to enter the file name + from stdin. + + 'mic' is to get audio input from a default live microphone device, + and 'adinnet' means receiving waveform data via tcpip network from + an adinnet client. 'netaudio' is from DatLink/NetAudio input, and + 'stdin' means data input from standard input. + + At Linux, you can choose API at run time by specifying alsa, oss and + esd. + + -lv thres + Level threshold for speech input detection. Values should be in + range from 0 to 32767. (default: 2000) + + -zc thres + Zero crossing threshold per second. Only input that goes over the + level threshold (-lv) will be counted. (default: 60) + + -headmargin msec + Silence margin at the start of speech segment in milliseconds. 
+ (default: 300) + + -tailmargin msec + Silence margin at the end of speech segment in milliseconds. + (default: 400) + + -zmean + This option enables DC offset removal. + + -smpFreq Hz + Set sampling rate in Hz. (default: 16,000) + + -48 + Record input with 48kHz sampling, and down-sample it to 16kHz + on-the-fly. This option is valid for 16kHz model only. The + down-sampling routine was ported from sptk. (Rev. 4.0) + + -NA devicename + Host name for DatLink server input (-input netaudio). + + -adport port_number + With -input adinnet, specify adinnet port number to listen. + (default: 5530) + + -nostrip + Julius by default removes successive zero samples in input speech + data. This option stop it. + + -C jconffile + Load a jconf file at here. The content of the jconffile will be + expanded at this point. + + -plugindir dirlist + Specify which directories to load plugin. If several direcotries + exist, specify them by colon-separated list. + +ENVIRONMENT VARIABLES + ALSADEV + Device name string for ALSA. (default: "default") + + AUDIODEV + Device name string for OSS. (default: "/dev/dsp") + + LATENCY_MSEC + Input latency of microphone input in milliseconds. Smaller value + will shorten latency but sometimes make process unstable. Default + value will depend on the running OS. 
SEE ALSO - adintool(1), julius(1), sox(1), wavplay(1), wavrec(1), aplay(1), - arecord(1) + julius ( 1 ) , + adintool ( 1 ) COPYRIGHT - Copyright (c) 1991-2006 Kawahara Lab., Kyoto University - Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius @ lavender.ics.nitech.ac.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL ADINREC(1) + 10/02/2008 ADINREC(1) Index: julius4/adinrec/adinrec.man diff -u julius4/adinrec/adinrec.man:1.1.1.1 julius4/adinrec/adinrec.man:removed --- julius4/adinrec/adinrec.man:1.1.1.1 Fri Sep 28 11:50:55 2007 +++ julius4/adinrec/adinrec.man Thu Oct 2 17:23:45 2008 @@ -1,56 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH ADINREC 1 LOCAL -.UC 6 -.SH NAME -adinrec - record one sentence utterance to a file -.SH SYNOPSIS -.B adinrec [options..] filename -.SH DESCRIPTION -.I adinrec -records one spoken utterance from microphone to a file. -.PP -Output format is WAV, 16bit, monoral, no compression. -If the file already exist, it will be overridden. If -filename of "-" is specified, recorded data will be output to stdout. -.PP -The sensitiveness of speech detection can be controlled by thresholds -of zerocross number and power (level). 
-.SH OPTIONS -.Ip "\-freq threshold" -Sampling frequency (Hz, default=16000) -.Ip "\-lv threslevel" -Level threshold (0-32767, default=2000) -.Ip "\-zc zerocrossnum" -Zero cross number threshold in a second (default=60) -.Ip "\-margin msec" -Record margin before/after the detected segment (milliseconds, default=300) -.Ip "\-nostrip" -Disable skipping of invalid zero samples (default: enabled) -.Ip "\-zmean" -Enable zero mean subtraction to remove DC offset. -.Ip "\-raw" -RAW format output (default: WAV) -.SH "SEE ALSO" -adintool(1), julius(1), sox(1), wavplay(1), wavrec(1), aplay(1), arecord(1) -.SH COPYRIGHT -Copyright (c) 1991-2006 Kawahara Lab., Kyoto University -.br -Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius @ lavender.ics.nitech.ac.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/adinrec/adinrec.man.ja diff -u julius4/adinrec/adinrec.man.ja:1.1.1.1 julius4/adinrec/adinrec.man.ja:removed --- julius4/adinrec/adinrec.man.ja:1.1.1.1 Fri Sep 28 11:50:55 2007 +++ julius4/adinrec/adinrec.man.ja Thu Oct 2 17:23:45 2008 @@ -1,60 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH ADINREC 1 LOCAL -.UC 6 -.SH NAME -adinrec - record one sentence utterance to a file -.SH SYNOPSIS -.B adinrec [options..] filename -.SH DESCRIPTION -.I adinrec -はマイク入力の音声区間を切り出してファイルに記録するツールです. -.PP -サンプリング周波数は任意に設定可能です.形式は 16bit monoral です.書き出されるデータ形式は WAV です. -既に同じ名前のファイルが存在する場合は上書きします. -.PP -また,ファイル名に "-" を指定すると標準出力へ出力します.この場合データ形式はRAWになります. -.PP -音声区間の切り出しは,一定時間内の零交差数とパワー(振幅レベル)の -しきい値を用います. -.SH OPTIONS -.Ip "\-freq threshold" -サンプリング周波数.単位は Hz (default: 16000) -.Ip "\-lv threslevel" -波形の振幅レベルのしきい値 (0 - 32767).(default: 2000). 
-.Ip "\-zc zerocrossnum" -1秒あたりの零交差数のしきい値 (default: 60) -.Ip "\-margin msec" -音声区間開始部および終了部の前後のマージン.単位はミリ秒 -(default: 300) -.Ip "\-nostrip" -無効な 0 サンプルの自動除去を行わないようにする. -デフォルトは自動除去を行う. -.Ip "\-zmean" -DC成分除去を行う. -.Ip "\-raw" -RAWフォーマットでの出力を行う.形式は 16bit, big endian である. -.SH "SEE ALSO" -adintool(1), julius(1), sox(1), wavplay(1), wavrec(1), aplay(1), arecord(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius @ lavender.ics.nitech.ac.jpまでお願いします. -.SH COPYRIGHT -Copyright (c) 1991-2006 京都大学 河原研究室 -.br -Copyright (c) 2000-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2006 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:45 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:45 +0900 Subject: [Julius-cvs 274] CVS update: julius4/generate-ngram Message-ID: <1222935825.756995.32227.nullmailer@users.sourceforge.jp> Index: julius4/generate-ngram/00readme-ja.txt diff -u /dev/null julius4/generate-ngram/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:45 2008 +++ julius4/generate-ngram/00readme-ja.txt Thu Oct 2 17:23:45 2008 @@ -0,0 +1,60 @@ + generate-ngram + +GENERATE-NGRAM(1) GENERATE-NGRAM(1) + + + +?? + generate-ngram + - N-gram ????????_????? + +?? + generate-ngram [options...] {binary_ngram} + +DESCRIPTION + generate-ngram ??????? N-gram ??????????_????? + ??????binary_ngram ??? ?????ョ? N-gram ???????? + ??? + +OPTIONS + -n num + ??????????????????10? + + -N + ???? N-gram ?????????????????????????? + ?????????3-gram ?? 3?? + + -bos + ?????????????????? + + -eos + ???L?????????????? + + -ignore + ?????????P?????????????? + + -v + ???o????? + + -debug + ????????s?? + +SEE ALSO + julius ( 1 ) , + mkbingram ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? 
+ +LICENSE + Julius ??????????D + + + + 10/02/2008 GENERATE-NGRAM(1) Index: julius4/generate-ngram/00readme.txt diff -u /dev/null julius4/generate-ngram/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:45 2008 +++ julius4/generate-ngram/00readme.txt Thu Oct 2 17:23:45 2008 @@ -0,0 +1,62 @@ + generate-ngram + +GENERATE-NGRAM(1) GENERATE-NGRAM(1) + + + +NAME + generate-ngram + - random sentence generator from N-gram + +SYNOPSIS + generate-ngram [options...] {binary_ngram} + +DESCRIPTION + generate-ngram is a tool to generate sentences randomly according to + the given N-gram language model. The N-gram model file binary_ngram + should be an binary format. + +OPTIONS + -n num + Number of sentences to generate (default: 10) + + -N + Specify which length of N-gram to use (default: available max in the + given model) + + -bos + Beginning-of-sentence word (default: "<s>") + + -eos + End-of-sentence word (default: "</s>") + + -ignore + Specify a word to be supressed from output (default: "<UNK>") [remainder of message 274 and the header of message 275 were lost in archiving] Index: julius4/gramtools/00readme-ja.txt diff -u julius4/gramtools/00readme-ja.txt:1.1.1.1 julius4/gramtools/00readme-ja.txt:1.2 --- julius4/gramtools/00readme-ja.txt:1.1.1.1 Fri Sep 28 11:50:55 2007 +++ julius4/gramtools/00readme-ja.txt Thu Oct 2 17:23:45 2008 @@ -8,255 +8,5 @@ gram2sapixml Julian ?ョ???? SAPI XML ???????????? dfa_determinize DFA?????? -====================================================================== -?????? - -???????? Julius ????????????? -??????ゥ???????????????????? - -???????????????????@?????????? -??????? Julius ???????????????? -??????????????? Julius ??????????????? -????????? - - 0) ????????タ?????????????????????? - - ?perl (ver.5) - ?GNU bison - ?GNU flex - ?GNU readline ????? - ?iconv - ?perl ? Jcode????? - - 1) ???????? julius ???????? - ??????????????? - - % cd .. - % ./configure - % make - % cd gramtools - - 2) ???????? configure ? make ?タ???? - - % ./configure - % make - - 4) ???????s????? "make install" ? /usr/local/bin ? - ????????? 
- - % make install - - - -====================================================================== -====================================================================== -====================================================================== -??????????? - - -====================================================================== -? mkdfa.pl --- ??????? - - mkdfa.pl ? Julian ??????????????????@????. -grammar ??????? .voca ?? Julian?? DFA ??ッォ???????D - - ????????????????????????? - ???????????r????????????? - - mkdfa.pl???????????? .grammar ??? .voca??????? -?????????????????????????????L????? -???????????????? - ------------------------------------------------------------- - タ???../sample_grammars/vfr/vfr.{grammar,voca}???? - - % mkdfa.pl ../sample_grammars/vfr/vfr - - ???? ../sample_grammars/vfr/vfr.{dfa,dict,term} ??????? ------------------------------------------------------------- - - ????????????????NFA????????DFA??????? -??????s?????.dfa ???????????????????. -dict ???????????????????????ォ????????D - - ????? .dfa ??????????????????ID?????? -????ID? .grammar ??????????????????? .term ?? -?????o???????????? generate ? nextword ?????? -???????????????? - - mkdfa ?タ??????????? mkfa????タ?????? mkdfa.pl -???????????????????mkdfa.pl ??????????? - - ??????t?????ョ????????C??????????D - - -====================================================================== -? dfa_minimize --- DFA???c?? - - DFA ?????????????A?????????C -???????FA??????? - -?????? mkdfa.pl ? DFA ???????ゥ??????????D -??? DFA ??????s?????L???????????? - - ?????????????DFA?????????????????? -???W???????????D???????FA????? -"-o ?????" ????????????????W?o???????D ------------------------------------------------------------- - ???1: - - % dfa_minimize vfr.dfa -o vfr-min.dfa - - ???2: - - % cat vfr.dfa | dfa_minimize > vfr-min.dfa - ------------------------------------------------------------- - - -====================================================================== -? generate --- ?????????? 
- - ??????????_???????????????????????? -??????????? - - タ??? .dfa, .dict, .term ??????????? mkdfa.pl ? -??????????? - ------ タ?? ------------------------------------------- - % bin/generate ../sample_grammars/vfr/vfr <-- ?? - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - silB ???? silE - silB ?????silE - silB ??? ? ??? ? ???? ??? silE - silB ??? ? ???? ? ?? ? ? ???? ??? silE - silB ???? ??? silE - silB ?? ? ?????? ??? silE - silB ?????? ??? silE - silB ??? ??? silE - silB ??? ? ??? ? ???? ??? silE - silB ??? ? ? ?? ??? silE - % --------------------------------------------------------- -????? "-n num" ??????????????????????10??? -????? "-t" ???????????????????(.term???)? - - -====================================================================== -? accept_check --- ??????/?????????? - - ??????????????????????????????????-??????????????????????????????? mkdfa.pl -???? .dfa, .dict, .term ???????????? - - ??????transcription?????????????????C??? -accept_check ??????^???????????????????? -?????????????? - - mkdfa.pl?????????????????????????????? -.dfa, .dict, .term?????????????????transcript???? - ??????transcript??????? - ??L?????????????????????? - ?accepted / rejected -??????D - - transcript?????????.voca??1?????)????????? -????????????????silB, silE ????????????? -?????????? sp ?transcript????????????????? -?transcript???????C.voca?????????????????? -????????????? - ----- タ?? --------------------------------------------- - % bin/accept_check ../sample_grammars/vfr/vfr <-- ?? - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - please input word sequence>silB ? ? ?? ??? silE <-- ?? - wseq: silB ? ? ?? ??? 
silE - cate: NS_B COLOR_N (NI|NI_AT) SURU_V KUDASAI_V NS_E - accepted - please input word sequence> ---------------------------------------------------------- - -???????????????????????゚?????????C -accept_check?????????????????(?Lタ??????)? - -??????? "-t" ????????????????????????? -???????????????C?????????P????????? -?????????????? - - -====================================================================== -? nextword --- ?????????????accept_check?????? - - ??????????????????????P?????o????? - - ??????????????P??/?????????????? - - ?????? mkdfa.pl ???? .dfa, .dict, .term ???????????? - - ???? ???????(right-to-left)??????????????? -Julian ??2??????????????????T?????????? -??????????????????? - ----- タ?? --------------------------------------------- - % bin/nextword ../sample_grammars/vfr/vfr <-- ?? - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - wseq > ? ?? ??? silE <-- ?? - [wseq: ? ?? ??? silE] - [cate: (NI|NI_AT) SURU_V KUDASAI_V NS_E] - PREDICTED CATEGORIES/WORDS: - KEIDOU_A (?? ?? ) - BANGOU_N (? ) - HUKU_N (? ?? ?? ) - PATTERN_N (???? ???ネ ...) - GARA_N (? ) - KANZI_N (?? ) - IRO_N (? ) - COLOR_N (? ? ? ...) - wseq > --------------------------------------------------------- - -transcript?????????macs???????????C -????????????? - - TAB ???????"-t"?????????????? - ????????????ヲ? - Ctrl-L ???????}?(??????????)? - Ctrl-P?Ctrl-N ??????D - -??????????? readline ?????????????????????D - -====================================================================== -? gram2sapixml --- Julian ?ョ???? SAPI XML ???????????? - -gram2sapixml/gram2sapixml.txt ???????? - -====================================================================== -? dfa_determinize --- DFA ???????? - -???????????????????????????C -??????????DFA???????? - -mkdfa.pl ????????? DFA ???????C????c??? -????????????????????? 
DFA ??????????-??????????? - - - ??+?????????????????????????? +?????????? 00readme-ja.txt ???????? Index: julius4/gramtools/00readme.txt diff -u julius4/gramtools/00readme.txt:1.1.1.1 julius4/gramtools/00readme.txt:1.2 --- julius4/gramtools/00readme.txt:1.1.1.1 Fri Sep 28 11:50:55 2007 +++ julius4/gramtools/00readme.txt Thu Oct 2 17:23:45 2008 @@ -9,194 +9,8 @@ gram2sapixml perl script to convert Julian grammar to SAPI XML format dfa_determinize DFA determinizer -To know how to write a grammar for Julian and about the file formats, -please see Grammar.txt for details. +Please see online manual or "00readme.txt" file under each directory. +Other document in Juliusbook or on the Web site will also helps you. -====================================================================== -How to compile + http://julius.sourceforge.jp/en/ -These tools are distributed as part of Julius. Compiling Julius from -the parent directory also compile these tools and install them. - -The below tools and libraries are needed to compile and run these tools. - - - perl (ver.5 and later) - - GNU bison - - GNU flex - - iconv - - Jcode.pm (only for gram2sapixml for Japanese code conversion) - -====================================================================== -====================================================================== - Manuals -====================================================================== -====================================================================== - -====================================================================== -mkdfa.pl --- Grammar compiler - - mkdfa.pl compiles the Julian format grammar (.grammar and - .voca) to Julian native formats (.dfa and .dict). - - Assume the .grammar file and .voca file has the same prefix - (i.e. 
"foo.grammar" and "foo.voca"), mkdfa.pl compiles them to the - Julian native format in the way below: - - ---------------------------------------------------- - % mkdfa.pl foo - ---------------------------------------------------- - Then it generates files "foo.dfa" and "foo.dict" in the same - directory. It also generates terminal symbol information in - "foo.term" that can be used other grammar tools. - - The mkdfa.pl is a script to spawn the core compile "mkfa", so you - need "mkfa" at the same directory of "mkdfa.pl". - - -====================================================================== -dfa_minimize --- minimize DFA grammar - - This tool will compress the DFA grammar to its equivalent minimal - form. - - dfa_minimize will be automatically used at when generating DFA in - mkdfa.pl. You can still use it separatedly from mkdfa.pl as - described to minimize existing DFAs. - - When invoked from command line, input filename can be specified. - if not specified, dfa_minimize will try to read DFA from standard - input. Also, output filename can be specified with "-o filename". - If not specified, it will output the result to standard output. - ------------------------------------------------------------- - ex.1: % dfa_minimize vfr.dfa -o vfr-min.dfa - - ex.2: % cat vfr.dfa | dfa_minimize > vfr-min.dfa ------------------------------------------------------------- - - -====================================================================== -generate --- Randam sentence generator - - This small program randomly generates sentences that are acceptable - by the given grammar. It can be used to check coverage of a - grammar in a human basis, by looking up if it may generate - non-acceptable sentences. - - .dfa, .dict and .term files are needed to execute. They can be - generated from .grammar and .voca file by mkdfa.pl. 
- - Options: - "-n num" specifies the number of sentence to be generated - (default: 10) - "-t" output in terminal name rather than word name (needs - .term file) - - ----- Example ------------------------------------------------ - - % generate ../sample_grammars/vfr/vfr - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - (sentences will be generated here...) - - -------------------------------------------------------------- - -====================================================================== -accept_check --- Check acception or rejection of sentences - - "accept_check" is a tool to check whether a sentence (word sequence) is - acceptable on the given grammar. Given a grammar, each input from - the standard input is parsed line by line and output whether they - are acceptable or not. - - .dfa, .dict and .term files are needed to execute. They will be - generated from .grammar and .voca file by mkdfa.pl. - - Usage: the grammar should be specified as the same style as - mkdfa.pl, i.e., the prefix of .dfa, .dict and .term should be - specified. See the examples below. - ----- Example --------------------------------------------- - % bin/accept_check ../sample_grammars/vfr/vfr - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - please input word sequence>silB hello silE <-- input - wseq: silB hello silE - cate: NS_B GREETING NS_E - accepted - please input word sequence> ---------------------------------------------------------- - - Input sentence should be a sequence of space-saprated words. The - short pause model (pronunciation given as "sp") in grammar will be - treated specially to allow skip. 
- - If there are several words in dictionary that matches the given - word, all the possible combination will be tried to check acceptability. - - Specifying "-t" option at startup time will enable category label as - an input. - - -====================================================================== -nextword --- display next predicted words - - Given a partial (part of) sentence from the end, it outputs - the next words allowed in the specified grammar. - - .dfa, .dict and .term files are needed to execute. They will be - generated from .grammar and .voca file by mkdfa.pl. - - !NOTE! The sentence should be specified from the END OF SENTENCE, - because Julian does right-to-left parsing. - ----- Example --------------------------------------------- - % bin/nextword ../sample_grammars/vfr/vfr - Reading in dictionary...done - Reading in DFA grammar...done - Mapping dict item <-> DFA terminal (category)...done - Reading in term file (optional)...done - 42 categories, 99 words - DFA has 135 nodes and 198 arcs - ----- - wseq > afternoon silE <-- input - [wseq: afternoon silE] - [cate: AFTERNOON NS_E] - PREDICTED CATEGORIES/WORDS: - NS_B (silB) - GOOD (good) - wseq > --------------------------------------------------------- - - You can use completion and history for wseq input, which is a - function of GNU readline library. The important keys are: - - TAB completion of dictionary word. When invoking - with "-t" option, completion will be category name. - Ctrl-P, Ctrl-N history up/down. - -====================================================================== -gram2sapixml --- perl script to convert Julian grammar to SAPI XML format - -See gram2sapixml/gram2sapixml.txt for detail. - -====================================================================== -dfa_determinize --- DFA determinizer - - This tool will determinize the DFA grammar. - - This tools is not used for normal use of DFA, since mkdfa.pl will - generate already determinized DFA. 
This program can be used for - conversion from other formats. - -*** END OF DOCUMENT From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 276] CVS update: julius4/gramtools/accept_check Message-ID: <1222935826.089127.32246.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/accept_check/00readme-ja.txt diff -u /dev/null julius4/gramtools/accept_check/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/accept_check/00readme-ja.txt Thu Oct 2 17:23:45 2008 @@ -0,0 +1,79 @@ + accept_check + +ACCEPT_CHECK(1) ACCEPT_CHECK(1) + + + +?? + accept_check + - ????????????/??????? + +?? + accept_check [-t] [-s spname] [-v] {prefix} + +DESCRIPTION + accept_check ????????????????????????????+ ???????????????????????????????????+ ???????accept_check ??????^?????????? + (prefix.dfa ??? prefix.dict) ??????????????????? + ?????????????? + + タ??? .dfa, .dict, .term ???????????? ????? + mkdfa.pl ???????????? + + ???????C???????(.voca??1?????)????????? + ????????????????silB, silE ????????????? + ???????? ?????????????????????? + + ??????????????Caccept_check ???????゚????? + ??????????????????????????????????? + ??????????????????????????? + +OPTIONS + -t + ???????????????????D + + -s spname + ????????????????????????? (default: "sp") + + -v + ??????D + +EXAMPLES + vfr (?????????????) ??タ??? + + % accept_check vfr + Reading in dictionary...done + Reading in DFA grammar...done + Mapping dict item <-> DFA terminal (category)...done + Reading in term file (optional)...done + 42 categories, 99 words + DFA has 135 nodes and 198 arcs + ----- + please input word sequence>silB ? ? ?? ??? silE + wseq: silB ? ? ?? ??? silE + cate: NS_B COLOR_N (NI|NI_AT) SURU_V KUDASAI_V NS_E + accepted + please input word sequence> + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate ( 1 ) , + nextword ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? 
????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 ACCEPT_CHECK(1) Index: julius4/gramtools/accept_check/00readme.txt diff -u /dev/null julius4/gramtools/accept_check/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/accept_check/00readme.txt Thu Oct 2 17:23:45 2008 @@ -0,0 +1,80 @@ + accept_check + +ACCEPT_CHECK(1) ACCEPT_CHECK(1) + + + +NAME + accept_check + - Check whether a grammar accept / reject given word sequences + +SYNOPSIS + accept_check [-t] [-s spname] [-v] {prefix} + +DESCRIPTION + accept_check is a tool to check whether a sentence can be accepted or + rejected on a grammar (prefix.dfa and prefix.dict). The sentence should + be given from standard input. You can do a batch check by preparing all + test sentence at each line of a text file, and give it as standard + input of accept_check. + + This tool needs .dfa, .dict and .term files. You should convert a + written grammar file to generate them by mkdfa.pl. + + A sentence should be given as space-separated word sequence. It may be + required to add head / tail silence word like sil, depending on your + grammar. And should not contain a short-pause word. + + When a word belongs to various category in a grammar, accept_check will + check all the possible sentence patterns, and accept it if any of those + is acceptable. + +OPTIONS + -t + Use category name as input instead of word. + + -s spname + Short-pause word name to be skipped. (default: "sp") + + -v + Debug output. + +EXAMPLES + An output for "date" grammar: + + % echo ' NEXT SUNDAY ' | accept_check date + Reading in dictionary... 
+ 143 words...done + Reading in DFA grammar...done + Mapping dict item <-> DFA terminal (category)...done + Reading in term file (optional)...done + 27 categories, 143 words + DFA has 35 nodes and 71 arcs + ----- + wseq: NEXT SUNDAY + cate: NS_B (NEXT|NEXT) (DAYOFWEEK|DAYOFWEEK|DAY|DAY) NS_E + accepted + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate ( 1 ) , + nextword ( 1 ) + +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 ACCEPT_CHECK(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 277] CVS update: julius4/gramtools/dfa_determinize Message-ID: <1222935826.276404.32256.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/dfa_determinize/00readme-ja.txt diff -u /dev/null julius4/gramtools/dfa_determinize/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/dfa_determinize/00readme-ja.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,48 @@ + dfa_determinize + +DFA_DETERMINIZE(1) DFA_DETERMINIZE(1) + + + +?? + dfa_determinize + - ???????????????? + +?? + dfa_determinize [-o outfile] {dfafile} + +DESCRIPTION + dfa_determinize ??.dfa ??????????? .dfa ????????? + ??o???????D????? -o ????????????????? + + + mkdfa.pl ?????DFA???????????C ??Cmkdfa.pl ???? + ?? .dfa ???????? ????????????????? + +OPTIONS + -o outfile + ??t?????????? + +EXAMPLES + foo.dfa ?????? bar.dfa ? ????? + ????? + +SEE ALSO + mkdfa.pl ( 1 ) , + dfa_minimize ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? 
Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 DFA_DETERMINIZE(1) Index: julius4/gramtools/dfa_determinize/00readme.txt diff -u /dev/null julius4/gramtools/dfa_determinize/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/dfa_determinize/00readme.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,51 @@ + dfa_determinize + +DFA_DETERMINIZE(1) DFA_DETERMINIZE(1) + + + +NAME + dfa_determinize + - Determinize NFA grammar network. + +SYNOPSIS + dfa_determinize [-o outfile] {dfafile} + +DESCRIPTION + dfa_determinize converts a non-deterministic .dfa file into + deterministic DFA. Output to standard output, or file specified by "-o" + option. + + This additional tool is not necessary on a grammar building procedure + in Julius, since the grammar network generated by mkdfa.pl is always + determinized. + +OPTIONS + -o outfile + Output file. If not specified, output to stdout. + +EXAMPLES + Determinize foo.dfa to bar.dfa: + Another way: + +SEE ALSO + mkdfa.pl ( 1 ) , + dfa_minimize ( 1 ) + +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius.
+ + + + 10/02/2008 DFA_DETERMINIZE(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 278] CVS update: julius4/gramtools/dfa_minimize Message-ID: <1222935826.473788.32265.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/dfa_minimize/00readme-ja.txt diff -u /dev/null julius4/gramtools/dfa_minimize/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/dfa_minimize/00readme-ja.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,49 @@ + dfa_minimize + +DFA_MINIMIZE(1) DFA_MINIMIZE(1) + + + +?? + dfa_minimize + - ????????????????+ +?? + dfa_minimize [-o outfile] {dfafile} + +DESCRIPTION + dfa_minimize ??.dfa ????????????.dfa ????????? + ??o???????D????? -o ????????????????? + + ????? 3.5.3 ??? Julius ???? mkdfa.pl ?? ???????? + ?ゥ?????????C?????.dfa ??????????????? + ???タ????????????????? 3.5.2 ??? mkdfa.pl ???+ ??? .dfa ????????????C ????????????T??? + ????????????? + +OPTIONS + -o outfile + ??t?????????? + +EXAMPLES + foo.dfa ??????bar.dfa ? ????? + ????? + +SEE ALSO + mkdfa.pl ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 DFA_MINIMIZE(1) Index: julius4/gramtools/dfa_minimize/00readme.txt diff -u /dev/null julius4/gramtools/dfa_minimize/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/dfa_minimize/00readme.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,49 @@ + dfa_minimize + +DFA_MINIMIZE(1) DFA_MINIMIZE(1) + + + +NAME + dfa_minimize + - Minimize a DFA grammar network + +SYNOPSIS + dfa_minimize [-o outfile] {dfafile} + +DESCRIPTION + dfa_minimize will convert an .dfa file to an equivalent minimal form. + Output to standard output, or to a file specified by "-o" option. 
+ + On version 3.5.3 and later, mkdfa.pl invokes this tool inside, and the + output .dfa file will be always minimized, so you do not need to use + this manually. + +OPTIONS + -o outfile + Output file. If not specified output to standard output. + +EXAMPLES + Minimize foo.dfa to bar.dfa: + Another way: + +SEE ALSO + mkdfa.pl ( 1 ) + +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 DFA_MINIMIZE(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 279] CVS update: julius4/gramtools/generate Message-ID: <1222935826.660547.32274.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/generate/00readme-ja.txt diff -u /dev/null julius4/gramtools/generate/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/generate/00readme-ja.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,75 @@ + generate + +GENERATE(1) GENERATE(1) + + + +?? + generate + - ?????????????? + +?? + generate [-v] [-t] [-n num] [-s spname] {prefix} + +DESCRIPTION + generate ???????????_???????? + + タ??? .dfa, .dict, .term ???????????? ????? + mkdfa.pl ???????????? + +OPTIONS + -t + ????????????????D + + -n num + ???????????? (default: 10) + + -s spname + ??????????????????????????????? + (default: "sp") + + -v + ??????D + +EXAMPLES + vfr (?????????????) ??タ??? + + % generate vfr + Reading in dictionary...done + Reading in DFA grammar...done + Mapping dict item <-> DFA terminal (category)...done + Reading in term file (optional)...done + 42 categories, 99 words + DFA has 135 nodes and 198 arcs + ----- + silB ???? silE + silB ?????silE + silB ??? ? 
??? ? ???? ??? silE + silB ??? ? ???? ? ?? ? ? ???? ??? silE + silB ???? ??? silE + silB ?? ? ?????? ??? silE + silB ?????? ??? silE + silB ??? ??? silE + silB ??? ? ??? ? ???? ??? silE + silB ??? ? ? ?? ??? silE + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate-ngram ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 GENERATE(1) Index: julius4/gramtools/generate/00readme.txt diff -u /dev/null julius4/gramtools/generate/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/generate/00readme.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,76 @@ + generate + +GENERATE(1) GENERATE(1) + + + +NAME + generate + - random sentence generator from a grammar + +SYNOPSIS + generate [-v] [-t] [-n num] [-s spname] {prefix} + +DESCRIPTION + This small program randomly generates sentences that are acceptable by + the given grammar. + + + .dfa, .dict and .term files are needed to execute. They can be + generated from .grammar and .voca file by mkdfa.pl. + +OPTIONS + -t + Output in word's category name. + + -n num + Set number of sentences to be generated (default: 10) + + -s spname + the name string of short-pause word to be supressed (default: "sp") + + -v + Debug output mode. 
+ +EXAMPLES + Exmple output of a sample grammar "fruit": + + % generate fruit + Stat: init_voca: read 36 words + Reading in term file (optional)...done + 15 categories, 36 words + DFA has 26 nodes and 42 arcs + ----- + I WANT ONE APPLE + I WANT TEN PEARS + CAN I HAVE A PINEAPPLE + I WANT ONE PEAR + COULD I HAVE A BANANA + I WANT ONE APPLE PLEASE + I WANT NINE APPLES + NINE APPLES + I WANT ONE PINEAPPLE + I WANT A PEAR + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate-ngram ( 1 ) + +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 GENERATE(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 280] CVS update: julius4/gramtools/gram2sapixml Message-ID: <1222935826.820415.32283.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/gram2sapixml/00readme-ja.txt diff -u /dev/null julius4/gramtools/gram2sapixml/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/gram2sapixml/00readme-ja.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,53 @@ + gram2sapixml.pl + +GRAM2SAPIXML.PL(1) GRAM2SAPIXML.PL(1) + + + +?? + gram2sapixml.pl + - ?ッ???? SAPI XML ???????????? + +?? + gram2sapixml.pl [prefix...] + +DESCRIPTION + gram2sapixml.pl ??Julius ??ッ??????? (.grammar, .voca) ?? + Microsoft SAPI XML ?ョ????????????? prefix ??????? + .grammar, .voca ?? ???????????????O????????? + ??????????C ????????????? + + ???????? EUC-JP???????????t???? UTF-8 ???? + ?????????????????? iconv ??? ?????? + + ??????????????????K?????????? .grammar ? + ??????????????.grammar ??????????A?????+ ?? .xml ????????????????? .xml ?????????? 
+ ??????????????????? + +SEE ALSO + mkdfa.pl ( 1 ) + +DIAGNOSTICS + ???????????????[????[??(???????)???? + ???????????????Dタ??SAPI??????????????+ ???????????????????????K???? + + ????????? iconv ????????? タ?????iconv ????+ ??????????? + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 GRAM2SAPIXML.PL(1) Index: julius4/gramtools/gram2sapixml/00readme.txt diff -u /dev/null julius4/gramtools/gram2sapixml/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/gram2sapixml/00readme.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,55 @@ + gram2sapixml.pl + +GRAM2SAPIXML.PL(1) GRAM2SAPIXML.PL(1) + + + +NAME + gram2sapixml.pl + - convert Julius grammar to SAPI XML grammar format + +SYNOPSIS + gram2sapixml.pl [prefix...] + +DESCRIPTION + gram2sapixml.pl converts a recognition grammar file of Julius + (.grammar, .voca) to Microsoft SAPI XML grammar format. prefix should + be a file name of target grammar, excluding suffixes. If multiple + arguments are given, each will be processed sequentially in turn. + + The internal character set should be in UTF-8 format. By default + gram2sapixml.pl assumes input in EUC-JP encoding and tries to convert it + to UTF-8 using iconv. You may want to disable this feature within the + script. + + It will fail to convert a left recursive rule in the grammar. When + it fails, it will leave the source rules in the target .xml file, so you + should modify the output manually to solve it. + +SEE ALSO + mkdfa.pl ( 1 ) + +DIAGNOSTICS + The conversion procedure is a somewhat dumb one, only converting the + non-terminal symbols and terminal symbols (=word category name) into + corresponding rules one by one. This is only a helper tool, and you will + need manual inspection and editing to use it on a real SAPI + application.
+ +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 GRAM2SAPIXML.PL(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:46 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:46 +0900 Subject: [Julius-cvs 281] CVS update: julius4/gramtools/mkdfa Message-ID: <1222935826.987935.32298.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/mkdfa/00readme-ja.txt diff -u /dev/null julius4/gramtools/mkdfa/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/mkdfa/00readme-ja.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,72 @@ + mkdfa.pl + +MKDFA.PL(1) MKDFA.PL(1) + + + +?? + mkdfa.pl + - Julius ?ョ???????????????????? + +?? + mkdfa.pl [options...] {prefix} + +DESCRIPTION + mkdfa.pl ? Julius ?????????????????@???? + (.grammar) ??????? (.voca) ???Julius??????I????? + ???? (.dfa) ????ッォ?(.dict) ??????????????? + ????????????????? ID ??????? .term ????? + ????????D + + ??????ョ????????C??????????????? + + + prefix ??.grammar ??????? .voca????? ?????????? + ????????prefix.grammar? prefix.voca??prefix.dfa? + prefix.dict??? prefix.term???????? + + ????? 3.5.3 ??? Julius ???? mkdfa.pl ?? dfa_minimize ?? + ??ゥ?????????C ?????.dfa ????????????D + +OPTIONS + -n + ォ??o?????.voca ??? .grammar ??? .dfa ????? ?? + ????? + +ENVIRONMENT VARIABLES + TMP ??? TEMP + ????????????????????????? ???????C + /tmp, /var/tmp, /WINDOWS/Temp, /WINNT/Temp ????????????+ ??g????? + +EXAMPLES + ?????? foo.grammar, foo.voca? ??????タ?????? foo.dfa + ? foo.voca???foo.term??????D + +SEE ALSO + julius ( 1 ) , + generate ( 1 ) , + nextword ( 1 ) , + accept_check ( 1 ) , + dfa_minimize ( 1 ) + +DIAGNOSTICS + mkdfa.pl ???? mkfa ??? 
dfa_minimize ???????Dタ????? + ??タ??? ?????? mkdfa.pl ?????????????????? + ????? ????Julius ?????????? + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 MKDFA.PL(1) Index: julius4/gramtools/mkdfa/00readme.txt diff -u /dev/null julius4/gramtools/mkdfa/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:46 2008 +++ julius4/gramtools/mkdfa/00readme.txt Thu Oct 2 17:23:46 2008 @@ -0,0 +1,67 @@ + mkdfa.pl + +MKDFA.PL(1) MKDFA.PL(1) + + + +NAME + mkdfa.pl + - grammar compiler + +SYNOPSIS + mkdfa.pl [options...] {prefix} + +DESCRIPTION + mkdfa.pl compiles the Julian format grammar (.grammar and .voca) to + Julian native formats (.dfa and .dict). In addition, ".term" will be + also generated that stores correspondence of category ID used in the + output files to the source category name. + + + prefix should be the common file name prefix of ".grammar" and ".voca" + file. From prefix.grammar and prefix.voca file, prefix.dfa, prefix.dict + and prefix.term will be output. + +OPTIONS + -n + Do not process the dictionary. You can only convert .grammar file to .dfa + file without .voca file. + +ENVIRONMENT VARIABLES + TMP or TEMP + Set directory to store temporary files. If not specified, one of them + on the following list will be used: /tmp, /var/tmp, /WINDOWS/Temp, + /WINNT/Temp. + +EXAMPLES + Convert a grammar foo.grammar and foo.voca to foo.dfa, foo.dict and + foo.term. + +SEE ALSO + julius ( 1 ) , + generate ( 1 ) , + nextword ( 1 ) , + accept_check ( 1 ) , + dfa_minimize ( 1 ) + +DIAGNOSTICS + mkdfa.pl invokes mkfa and dfa_minimize internally. They should be + placed in the same directory as mkdfa.pl.
+ +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 MKDFA.PL(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:47 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:47 +0900 Subject: [Julius-cvs 282] CVS update: julius4/gramtools/nextword Message-ID: <1222935827.153182.32308.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/nextword/00readme-ja.txt diff -u /dev/null julius4/gramtools/nextword/00readme-ja.txt:1.1 --- /dev/null Thu Oct 2 17:23:47 2008 +++ julius4/gramtools/nextword/00readme-ja.txt Thu Oct 2 17:23:47 2008 @@ -0,0 +1,84 @@ + nextword + +NEXTWORD(1) NEXTWORD(1) + + + +?? + nextword + - DFA ???????????????????? + +?? + nextword [-t] [-r] [-s spname] [-v] {prefix} + +DESCRIPTION + nextword ??mkdfa.pl ????????? DFA ?? ??C??????? + ?????????????????o????? + + タ??? .dfa, .dict, .term ???????????? ????? + mkdfa.pl ???????????? + + ???? mkdfa.pl ???????@???? ?????????????? + ?????????????????? ????Julius ??2??????? + ??????????? ?????nextword ?????????????? + ??? + +OPTIONS + -t + ???????????????????D + + -r + ??????????D + + -s spname + ????????????????????????? (default: "sp") + + -v + ??????D + +EXAMPLES + vfr (?????????????) ??タ??? + + % nextword vfr + Reading in dictionary...done + Reading in DFA grammar...done + Mapping dict item <-> DFA terminal (category)...done + Reading in term file (optional)...done + 42 categories, 99 words + DFA has 135 nodes and 198 arcs + ----- + wseq > ? ?? ??? silE + [wseq: ? ?? ??? silE] + [cate: (NI|NI_AT) SURU_V KUDASAI_V NS_E] + PREDICTED CATEGORIES/WORDS: + KEIDOU_A (?? ?? ) + BANGOU_N (? ) + HUKU_N (? ?? ?? ) + PATTERN_N (???? ???ネ ...) + GARA_N (? 
) + KANZI_N (?? ) + IRO_N (? ) + COLOR_N (? ? ? ...) + wseq > + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate ( 1 ) , + accept_check ( 1 ) + +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ + + Copyright (c) 2005-2008 ??????? Julius????? + +LICENSE + Julius ??????????D + + + + 10/02/2008 NEXTWORD(1) Index: julius4/gramtools/nextword/00readme.txt diff -u /dev/null julius4/gramtools/nextword/00readme.txt:1.1 --- /dev/null Thu Oct 2 17:23:47 2008 +++ julius4/gramtools/nextword/00readme.txt Thu Oct 2 17:23:47 2008 @@ -0,0 +1,82 @@ + nextword + +NEXTWORD(1) NEXTWORD(1) + + + +NAME + nextword + - display next predicted words (in reverse order) + +SYNOPSIS + nextword [-t] [-r] [-s spname] [-v] {prefix} + +DESCRIPTION + Given a partial (part of) sentence from the end, it outputs the next + words allowed in the specified grammar. + + + .dfa, .dict and .term files are needed to execute. They can be + generated from .grammar and .voca file by mkdfa.pl. + + Please note that the latter part of sentence should be given, since the + main 2nd pass does a right-to-left parsing. + +OPTIONS + -t + Input / Output in category name. (default: word) + + -r + Enter in reverse order + + -s spname + the name string of short-pause word to be supressed (default: "sp") + + -v + Debug output. 
+ +EXAMPLES + Exmple output of a sample grammar "fruit": + + % nextword fruit + Stat: init_voca: read 36 words + Reading in term file (optional)...done + 15 categories, 36 words + DFA has 26 nodes and 42 arcs + ----- + command completion is disabled + ----- + wseq > A BANANA + [wseq: A BANANA ] + [cate: (NUM_1|NUM_1|A|A) FRUIT_SINGULAR NS_E] + PREDICTED CATEGORIES/WORDS: + NS_B ( ) + HAVE (HAVE ) + WANT (WANT ) + NS_B ( ) + HAVE (HAVE ) + WANT (WANT ) + + +SEE ALSO + mkdfa.pl ( 1 ) , + generate ( 1 ) , + accept_check ( 1 ) + +COPYRIGHT + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Technology + + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology + +LICENSE + The same as Julius. + + + + 10/02/2008 NEXTWORD(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:47 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:47 +0900 Subject: [Julius-cvs 283] CVS update: julius4/jclient-perl Message-ID: <1222935827.314582.32317.nullmailer@users.sourceforge.jp> Index: julius4/jclient-perl/00readme-ja.txt diff -u julius4/jclient-perl/00readme-ja.txt:1.1 julius4/jclient-perl/00readme-ja.txt:1.2 --- julius4/jclient-perl/00readme-ja.txt:1.1 Tue Sep 16 12:55:48 2008 +++ julius4/jclient-perl/00readme-ja.txt Thu Oct 2 17:23:47 2008 @@ -1,21 +1,47 @@ -jclient.pl -============ + jclient.pl -Julius ?????????????? "jcontrol" ? Perl ???? -???????????????? Julius ???ッ?????????? -Julius ??????????? +JCLIENT.PL(1) JCLIENT.PL(1) -??? 57 ?????????????????????? Julius ???? -???????????????ゥ?????????? ---- -jclient.pl ? ???? ?? (nisimura @ sys.wakayama-u.ac.jp) ????? -????????????????????????メ??????????-???ゥ??????????????? +?? + jclient.pl + - perl ??????????? -??????????????????????????????? -?L???????????????????????????? +?? 
+ jclient.pl - http://w3voice.jp/ +DESCRIPTION + Julius ?????????????? "jcontrol" ? Perl ???? ? + ??????????????? Julius ???ッ?????????? + Julius ??????????? + ??? 57 ?????????????????????? Julius ???? + ???????????????ゥ?????????? + +EXAMPLES + ?L?????? Julius ????????????????jclient.pl ? + ???????????????????? localhost, ?????? 10500 + ??????????X?????????????????D + ??????????????????? jclient.pl ??????? ??o + ????????D???jclient.pl ????????????? ???? + Enter ??????Julius ???????????Julius ???????? + ?????????????W?????????????????D + +SEE ALSO + julius ( 1 ) , + jcontrol ( 1 ) + +COPYRIGHT + jclient.pl ? ???? ?? (nisimura @ sys.wakayama-u.ac.jp) ????? + ????????????????????????メ??????????+ ???ゥ??????????????? + + ??????????????????????????????? ?L?? + ?????????????????????????? + + http://w3voice.jp/ + + + + 10/02/2008 JCLIENT.PL(1) Index: julius4/jclient-perl/00readme.txt diff -u julius4/jclient-perl/00readme.txt:1.1 julius4/jclient-perl/00readme.txt:1.2 --- julius4/jclient-perl/00readme.txt:1.1 Tue Sep 16 12:55:48 2008 +++ julius4/jclient-perl/00readme.txt Thu Oct 2 17:23:47 2008 @@ -1,19 +1,46 @@ -jclient.pl -============ + jclient.pl -This is a perl version of "jcontrol". -You can receive recognition result from Julius running in module mode, -or send command to Julius. +JCLIENT.PL(1) JCLIENT.PL(1) -You can use this tiny program for free. ---- -"jclient.pl" has been developed by Dr. Ryuichi Nisimura -(nisimura @ sys.wakayama-u.ac.jp). Use at your own risk. +NAME + jclient.pl + - sample client for module mode (perl version) -If you have any feedback, comment or request, please contact the -E-mail address above, or look at the Web page below. +SYNOPSIS + jclient.pl - http://w3voice.jp/ +DESCRIPTION + This is yet another sample client written in perl. It will connect to + Julius running in module mode, receive recognition results from Julius, + and can send commands to control Julius. + This is a tiny program with only 57 lines. You can use it for free.
+ +EXAMPLES + Invoke Julius with module mode by specifying "-module" option: + Then, at other terminal or other host, invoke jclient.pl like below. + The default hostname is "localhost", and port number is 10500. You can + change them by editing the top part of the script. + It will then receive the outputs of Julius and output the raw message + to standard out. Also, by inputting a raw module command to the + standard input of jclient.pl, it will be sent to Julius. See manuals + for the specification of module mode. + +SEE ALSO + julius ( 1 ) , + jcontrol ( 1 ) + +COPYRIGHT + "jclient.pl" has been developed by Dr. Ryuichi Nisimura + (nisimura @ sys.wakayama-u.ac.jp). Use at your own risk. + + If you have any feedback, comment or request, please contact the E-mail + address above, or look at the Web page below. + + http://w3voice.jp/ + + + + 10/02/2008 JCLIENT.PL(1) From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:47 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:47 +0900 Subject: [Julius-cvs 284] CVS update: julius4/jcontrol Message-ID: <1222935827.520576.32330.nullmailer@users.sourceforge.jp> Index: julius4/jcontrol/00readme-ja.txt diff -u julius4/jcontrol/00readme-ja.txt:1.2 julius4/jcontrol/00readme-ja.txt:1.3 --- julius4/jcontrol/00readme-ja.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/jcontrol/00readme-ja.txt Thu Oct 2 17:23:47 2008 @@ -1,157 +1,173 @@ + jcontrol + JCONTROL(1) JCONTROL(1) -NAME - jcontrol - simple program to control Julius module via API +?? + jcontrol + - Julius???????????????????? -SYNOPSIS - jcontrol hostname [portnum] +?? + jcontrol {hostname} [portnum] DESCRIPTION - jcontrol ???????????? julius ??API??????????? - ????????????????? Julius ??? ? ? ? ? ?? ? ? - ?Julius????????????????????? - - ????jcontrol ????????????u?????????????? - Julius ??????????????????jcontrol ???????? ? - ??????????????D + jcontrol ????????????????? julius ?????API??? + ?????????????????????????Julius ?????? 
+ ????????????????? Julius ????ッ????????? + ? ?????????????????? + + ????jcontrol ????????????u????????????? + ?Julius ??????????????????jcontrol ???????? + ?????????????????????????D - jcontrol ? ???????????????゚??????API????? - Julius ??????????Julius ???ッ??????????? ? ? + jcontrol ? ???????????????゚??????API????? + Julius ??????????Julius ???ッ???????????? ? ????????????????????????o????o???? - API?????????A????????D + ???????????????????????????D OPTIONS - hostname - ?????????Julius ?????????????? - - portnum - (optional) ????? (default=10500) + hostname + ???????? -COMMANDS (COMMON) - ? ? ??jcontrol ??????????????????????????- ?? + portnum + ????????????10500? - pause ?ッ???????ッ?????C???????????2??? ? - ?ッ????????f??? +COMMANDS + jcontrol ??????????????????????? ??????? + ??????? + + ???? + pause + Julius??ッ????????????????s?????????? + ???Julius???????????????ッ???s???? ??? + ?????ッ???r????????????????C Julius ??? + ?ッ???I?????????????s??? terminate - ?ッ???????ッ?????C?????????????? - resume ?ッ???? + pause?????Julius??ッ???????? ????????s?? + ??????????ッ???r????? ???????????C? + ??????????????????????? + + resume + Julius ???????????????s????ッ??????? inputparam arg - ? ? ??????????????????????????w?? - "TERMINATE", "PAUSE", "WAIT"??????????? + ????????????????????????????w?? + "TERMINATE", "PAUSE", "WAIT"??????????? version - ??????????? - - status ???????active/sleep)???? + Julius ??????????????? -GRAMMAR COMMANDS - ??????ッ????????? + status + Julius ?????????(active / sleep) ??????? + ??????ッ?? changegram prefix - ?ッ??? "prefix.dfa" ? "prefix.dict" ?????????? ? - ???????????????C?????????????? + ?ッ??? "prefix.dfa" ? "prefix.dict" ????????????? + ?????????????C?????????????? addgram prefix - ?ッ????? "prefix.dfa" ? "prefix.dict" ?????? + ?ッ????? "prefix.dfa" ? "prefix.dict" ??????????? + ???? - deletegram ID - ?????ID??ッ???????D??????????????? - ?????DID ? Julian ?????? GRAMINFO ???????? - ?? - - deactivategram ID - ?????ID??ッ????????OFF????OFF???????? 
- ッ??????I??O??????OFF??????? Julius ? ? - ????? "activategram" ??????? ON ????? + deletegram gramlist + ??????????????????????D???????? ?? + ????? prefix??????? Julius ?????? GRAMINFO???? + ?? ID ????????????????????C???????ID? + ? ??????????????ID?????????????? + + deactivategram gramlist + ????????????????????????????????? + ???????????????????ッ???????I??O?? + ?? ????????? activategram ?????????? + + ??????????????? prefix???????Julius ???? + ?? GRAMINFO?????? ID ??????? ????????????+ ?????????ID????????? ???????ID?????? + ???????? + + activategram gramlist + ?????????????????????????? ??????? + ???????? prefix???????Julius ???? ?? GRAMINFO? + ????? ID ??????? ?????????????C????? + ??ID????????? ???????ID??????????? + ??? - activategram ID - ???? OFF ??????????? ON ???? + addword grammar_name_or_id dictfile + dictfile ??????????????????????????? syncgram - ??????????????? + addgram ? deletegram ????????????????? ????? + ???? + + ??????????? + Julius-4 ???????????ッ?????????C ?ッ???? + ("-SR" ???????ッ??C?????) ??????????????? + ????????????? + + ????????????????????????????????? ?? + ??????????????????????????????? -COMMANDS (PROCESS) listprocess - ??????????ッ????????ヲ?? + Julius ???????????ッ?????????????? - currentprocess name - ?????タ??????J??????????????????? - ?? + currentprocess procname + ???????????????????????????? shiftprocess - ?????タ??????J??????????????D + ?????????????????D???????????????? + ??????????????? addprocess jconffile - ??????ッ??????????jconffile ???? LM ???? - ????????????????????????? LM ????ッ - ????? jconffile ????????????? - - delprocess name - ?????????ッ???????????????D + ??????ッ???????????????? jconffile ?????+ ?????? ?????? LM ??????????????????? + タ?????? ????????????????????Julius??? + ?????? ??????? Julius ????????w??????? + ?? + + ????? LM ????ッ??????jconffile ???? ?????? + ??? + + delprocess procname + ?????????ッ???????????????D + + deactivateprocess procname + ?????????ッ????????????????????? ?? + ????????????????ッ????X??????? 
???? + ??????? activateprocess ? ????????? - activateprocess name - ???????????????????????? + activateprocess procname + ?????????ッ??????????? - deactivateprocess name - ?????????????????? - - addword gram_id dictfile - dictfile??????????????? gram_id ???? ? ? ? - ?????????ッ??? - -EXAMPLE +EXAMPLES Julius ????????? "> " ???????????????o????- ????????e????????C?????Q???????D - - (1) Julius ????????????? host ?????? - % julius -C xxx.jconf ... -input mic -module - - (2) (?????) jcontrol ????????????? - % jcontrol host - connecting to host:10500...done - > - > # 0: [active] 99words, 42categories, 135nodes (new) - > - > - > # 0: [active] 99words, 42categories, 135 nodes - > Grobal: 99words, 42categories, 135nodes - > - > - -> pause - -> resume - > - -> addgram test - .... + ????????タ????? + ?L?????? Julius ???????????????? jcontrol ?? + ???????????????? + ??????????????????? jcontrol ????????? + jcontrol ????????????????? Enter ?????? Julius + ???????????Julius ???????? + ???v???????????????Q???????D SEE ALSO - julius(1) + julius ( 1 ) -BUGS - ??????????????? ? ? ? julius-info at lists.source- - forge.jp ????????? +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ -VERSION - This version is provided as part of Julius-3.5.1. + Copyright (c) 1997-2000 ????U?????(IPA) -COPYRIGHT - Copyright (c) 2002-2007 ???? ????コ - Copyright (c) 2002-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2007 ??????? Julius????? + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? 
LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL JCONTROL(1) + 10/02/2008 JCONTROL(1) Index: julius4/jcontrol/00readme.txt diff -u julius4/jcontrol/00readme.txt:1.2 julius4/jcontrol/00readme.txt:1.3 --- julius4/jcontrol/00readme.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/jcontrol/00readme.txt Thu Oct 2 17:23:47 2008 @@ -1,162 +1,173 @@ + jcontrol + JCONTROL(1) JCONTROL(1) NAME - jcontrol - simple program to control Julius module via API + jcontrol + - a sample module client written in C SYNOPSIS - jcontrol hostname [portnum] + jcontrol {hostname} [portnum] DESCRIPTION jcontrol is a simple console program to control julius running on other - host via network API. It can send command to Julius, and receive mes- - sages from Julius. + host via network API. It can send command to Julius, and receive + messages from Julius. - When invoked, jcontrol tries to connect to Julius running in "module - mode" on specified hostname. After connection established, jcontrol + When invoked, jcontrol tries to connect to Julius running in "module + mode" on specified hostname. After connection established, jcontrol waits for user commands from standard input. - When user types a command to jcontrol, it will be interpreted and cor- - responding API command will be sent to Julius. When a message is + When user types a command to jcontrol, it will be interpreted and cor- + responding API command will be sent to Julius. When a message is received from Julius, its content will be output to standard output. - For details about the API, see the related documents. + For the details about the API, see the related documents. OPTIONS - hostname - Host name where Julius is runnning in module mode. - - portnum - (optional) port number. (default=10500) + hostname + Host name where Julius is runnning in module mode. -COMMANDS (COMMON) - After startup, the command string below can be input from stdin. 
+ portnum + port number (default: 10500) - pause Stop recognition, cutting speech input at that point if any. +COMMANDS + jcontrol interprets commands from standard input. Below is a list of + all commands. + + Engine control + pause + Stop Julius and enter into paused status. In paused status, Julius + will not run recognition even if speech input occurs. When this + command is issued while recognition is running, Julius will stop + after the recognition has been finished. terminate - Stop recognition, discarding the current speech input if any. + Same as pause, but discard the current speech input when received + command in the middle of recognition process. - resume (re)start recognition. + resume + Restart Julius that has been paused or terminated. inputparam arg - Tell Julius how to deal with speech input in case grammar is - changed just when recognition is running. Specify one: "TERMI- - NATE", "PAUSE", "WAIT" + Tell Julius how to deal with speech input in case grammar is changed + just when recognition is running. Specify one: "TERMINATE", "PAUSE" + or "WAIT". version - Return version number. - - status Return trigger status (active/sleep). + Tell Julius to send version description string. -COMMANDS (GRAMMAR) - Below are Grammar-related command strings: + status + Tell Julius to send the system status (active / sleep) + Grammar handling changegram prefix - Change recognition grammar to "prefix.dfa" and "prefix.dict". - All the current grammars used in Julius are deleted and replaced - to the specifed grammar. + Send a new grammar "prefix.dfa" and "prefix.dict", and tell julius + to use it as a new grammar. All the current grammars used in the + current process of Julius will be deleted and replaced to the + specifed grammar. addgram prefix - tell Julius to use additional grammar "prefix.dfa" and "pre- - fix.dict" for recognition. The specified grammars are added to - the list of recognition grammars, and then activated. 
- - deletegram ID - tell Julius to delete grammar of the specified "ID". The - deleted grammar will be erased from Julius. The grammar "ID" is - sent from Julius at each time grammar information has changed. - - deactivategram ID - tell Julius to de-activate a grammar. The specified grammar - will become temporary OFF, and skipped from recognition process. - These de-activated grammars are kept in Julius, and can be acti- - vated by "activategram" command. + Send a new grammar "prefix.dfa" and "prefix.dict" and add it to the + current grammar. - activategram ID - tell Julius to activate previously de-activated grammar. + deletegram gramlist + Tell Julius to delete existing grammar. The grammar can be specified + by either prefix name or number ID. The number ID can be determined + from the message sent from Julius at each time grammar information + has changed. When you want to delete more than one grammar, specify all + of them as comma-separated. + + deactivategram gramlist + Tell Julius to de-activate a specified grammar. The specified + grammar will still be kept but will not be used for recognition. + + The target grammar can be specified by either prefix name or number + ID. The number ID can be determined from the message sent from + Julius at each time grammar information has changed. When you want to + de-activate more than one grammar, specify all of them as comma-separated. + + activategram gramlist + Tell Julius to activate previously de-activated grammar. The target + grammar can be specified by either prefix name or number ID. The + number ID can be determined from the message sent from Julius at + each time grammar information has changed. When you want to activate more + than one grammar, specify all of them as comma-separated. + + addword grammar_name_or_id dictfile + Add the recognition word entries in the specified dictfile to the + specified grammar on current process. syncgram - tell Julius to update grammar status now.
+ Force synchronize grammar status, like unix command "sync". + + Process management + Julius-4 supports multi-model recognition and multi decoding. In this + case it is possible to control each recognition process, as defined by + "-SR" option, from module client. + + In multi decoding mode, the module client holds "current process", and + the process commands and grammar related commands will be issued toward + the current process. -COMMANDS (PROCESS) listprocess - returns list of existing recognition process. + Tell Julius to send the list of existing recognition processes. - currentprocess name - switches the currently manipulating process to it. + currentprocess procname + Switch the current process to the process specified by the name. shiftprocess - rotate the curenttly manipulating process. + Rotate the current process. At each call the current process will be + changed to the next one. addprocess jconffile - adds a set of LM process SR process to the running engine. The - jconf file should contain only one LM specification, and can be - an accessible path at the server. The new processes will have - the name of the jconf file. - - delprocess name - removes a SR process with specified name from engine. - - activateprocess name - enables a SR process previously deactivated and turn it into - live status. - - deactivateprocess name - disables a specified SR process and turn it into dead status. - - addword gram_id dictfile - Send words in the dictfile to engine and add them to the grammar - specified by gram_id at current process. - -EXAMPLE - The dump messages from Julius are output to tty with prefix "> " - appended to each line. - - See related documents for more details. - - (1) start Julius in module mode at host 'host'. - % julius -C xxx.jconf ... -input mic -module - - (2) (on other tty) start jcontrol, and start communication.
- % jcontrol host - connecting to host:10500...done - > - > # 0: [active] 99words, 42categories, 135nodes (new) - > - > - > # 0: [active] 99words, 42categories, 135 nodes - > Grobal: 99words, 42categories, 135nodes - > - > - -> pause - -> resume - > - -> addgram test - .... - + Tell Julius to load a new recognition process into engine. The + argument jconffile should be a jconf file that contains only one set + of LM options and one SR definition. Note that the file should be + visible on the running Julius, since jcontrol only sends the path + name and Julius actually reads the jconf file. + + The new LM and SR process will have the name of the jconffile. + + delprocess procname + Delete the specified recognition process from the engine. + + deactivateprocess procname + Tell Julius to temporarily stop the specified recognition process. The + stopped process will not be executed for the input until activated + again. + + activateprocess procname + Tell Julius to activate the temporarily stopped process. + +EXAMPLES + The dump messages from Julius are output to tty with prefix ">" + appended to each line. Julius can be started in module mode like this: + jcontrol can be launched with the host name: + It will then receive the outputs of Julius and output the raw message + to standard out. Also, by inputting the commands above to the standard + input of jcontrol, it will be sent to Julius. See manuals for the + specification of module mode. SEE ALSO - julius(1) - -VERSION - This version is provided as part of Julius-4.0.
+ julius ( 1 ) COPYRIGHT - Copyright (c) 2002-2007 Kawahara Lab., Kyoto University - Copyright (c) 2002-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL JCONTROL(1) + 10/02/2008 JCONTROL(1) Index: julius4/jcontrol/jcontrol.man diff -u julius4/jcontrol/jcontrol.man:1.2 julius4/jcontrol/jcontrol.man:removed --- julius4/jcontrol/jcontrol.man:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/jcontrol/jcontrol.man Thu Oct 2 17:23:47 2008 @@ -1,143 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH JCONTROL 1 LOCAL -.UC 6 -.SH NAME -jcontrol - simple program to control Julius module via API -.SH SYNOPSIS -.B jcontrol hostname [portnum] -.SH DESCRIPTION -.I jcontrol -is a simple console program to control -.I julius -running on other host via network API. It can send command to Julius, -and receive messages from Julius. -.PP -When invoked, jcontrol tries to connect to Julius running in -"module mode" on specified hostname. After connection established, -jcontrol waits for user commands from standard input. -.PP -When user types -a command to jcontrol, it will be interpreted and corresponding API -command will be sent to Julius. When a message is received from -Julius, its content will be output to standard output. -.PP -For details about the API, see the related documents. -.SH "OPTIONS" -.Ip hostname -Host name where Julius is runnning in module mode. 
-.Ip portnum -(optional) port number. (default=10500) -.SH "COMMANDS (COMMON)" -After startup, the command string below can be input from stdin. -.Ip "pause" -Stop recognition, cutting speech input at that point if any. -.Ip "terminate" -Stop recognition, discarding the current speech input if any. -.Ip "resume" -(re)start recognition. -.Ip "inputparam arg" -Tell Julius how to deal with speech input in case grammar is changed -just when recognition is running. Specify one: "TERMINATE", "PAUSE", "WAIT" -.Ip "version" -Return version number. -.Ip "status" -Return trigger status (active/sleep). -.SH "COMMANDS (GRAMMAR)" -Below are Grammar-related command strings: -.Ip "changegram prefix" -Change recognition grammar to "prefix.dfa" and "prefix.dict". -All the current grammars used in Julius are deleted and replaced to -the specifed grammar. -.Ip "addgram prefix" -tell Julius to use additional grammar "prefix.dfa" and "prefix.dict" -for recognition. -The specified grammars are added to the list of recognition grammars, -and then activated. -.Ip "deletegram ID" -tell Julius to delete grammar of the specified "ID". -The deleted grammar will be erased from Julius. -The grammar "ID" is sent from Julius at each time grammar information -has changed. -.Ip "deactivategram ID" -tell Julius to de-activate a grammar. The specified grammar will become -temporary OFF, and skipped from recognition process. These de-activated -grammars are kept in Julius, and can be activated by -"activategram" command. -.Ip "activategram ID" -tell Julius to activate previously de-activated grammar. -.Ip "syncgram" -tell Julius to update grammar status now. -.SH "COMMANDS (PROCESS)" -.Ip "listprocess" -returns list of existing recognition process. -.Ip "currentprocess name" -switches the currently manipulating process to it. -.Ip "shiftprocess" -rotate the curenttly manipulating process. -.Ip "addprocess jconffile" -adds a set of LM process SR process to the running engine. 
The jconf -file should contain only one LM specification, and can be an -accessible path at the server. The new processes will have the name of -the jconf file. -.Ip "delprocess name" -removes a SR process with specified name from -engine. -.Ip "activateprocess name" -enables a SR process previously deactivated and turn it into live status. -.Ip "deactivateprocess name" -disables a specified SR process and turn it into dead status. -.Ip "addword gram_id dictfile" -Send words in the dictfile to engine and add them to the grammar -specified by gram_id at current process. -.SH "EXAMPLE" -The dump messages from Julius are output to tty with prefix -"> " appended to each line. -.PP -See related documents for more details. -.PP -(1) start Julius in module mode at host 'host'. - % julius -C xxx.jconf ... -input mic -module -.PP -(2) (on other tty) start jcontrol, and start communication. - % jcontrol host - connecting to host:10500...done - > - > # 0: [active] 99words, 42categories, 135nodes (new) - > - > - > # 0: [active] 99words, 42categories, 135 nodes - > Grobal: 99words, 42categories, 135nodes - > - > - -> pause - -> resume - > - -> addgram test - .... - -.SH "SEE ALSO" -julius(1) -.SH VERSION -This version is provided as part of Julius-4.0. -.SH COPYRIGHT -Copyright (c) 2002-2007 Kawahara Lab., Kyoto University -.br -Copyright (c) 2002-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/jcontrol/jcontrol.man.ja diff -u julius4/jcontrol/jcontrol.man.ja:1.2 julius4/jcontrol/jcontrol.man.ja:removed --- julius4/jcontrol/jcontrol.man.ja:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/jcontrol/jcontrol.man.ja Thu Oct 2 17:23:47 2008 @@ -1,136 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. 
-.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH JCONTROL 1 LOCAL -.UC 6 -.SH NAME -jcontrol - simple program to control Julius module via API -.SH SYNOPSIS -.B jcontrol hostname [portnum] -.SH DESCRIPTION -.I jcontrol -は,他のホストで動作中の -.I julius -を,APIを介してコントロールする簡単なコンソールプログラムです. -Julius へのコマンド送信,およびJuliusからのメッセージ受信を行うことが -できます. -.PP -起動後,jcontrol は,指定ホスト上において「モジュールモード」で動作中の -Julius に対し,接続を試みます.接続確立後,jcontrol はユー -ザーからのコマンド入力待ち状態となります. -.PP -jcontrol はユーザーが入力したコマンドを解釈し,対応するAPIコマンドを -Julius へ送信します.また,Julius から認識結果や入力トリガ情報などのメッ -セージが送信されてきたときは,その内容を標準出力へ書き出します. -.PP -APIの詳細については関連文書をご覧下さい. -.SH "OPTIONS" -.Ip hostname -接続先のホスト名(Julius がモジュールモードで動作中) -.Ip portnum -(optional) ポート番号 (default=10500) -.SH "COMMANDS (COMMON)" -起動後,jcontrol に対して以下のコマンド文字列を標準入力から入力できます. -.Ip "pause" -認識を中断する.認識途中の場合,そこで入力を中断して第2パスまで認識が -終わってから中断する. -.Ip "terminate" -認識を中断する.認識途中の場合,入力を破棄して即時中断する. -.Ip "resume" -認識を再開. -.Ip "inputparam arg" -文法切り替え時に音声入力であった場合の入力中音声の扱いを指定. -"TERMINATE", "PAUSE", "WAIT"のうちいずれかを指定. -.Ip "version" -バージョン文字列を返す -.Ip "status" -システムの状態(active/sleep)を返す. -.SH "GRAMMAR COMMANDS" -文法・単語認識用のコマンドです: -.Ip "changegram prefix" -認識文法を "prefix.dfa" と "prefix.dict" に切り替える. -カレントプロセス内の文法は全て消去され,指定された文法に置き換わる. -.Ip "addgram prefix" -認識文法として "prefix.dfa" と "prefix.dict" を追加する. -.Ip "deletegram ID" -指定されたIDの認識文法を削除する. -指定文法はカレントプロセスから削除される.ID は Julian から送られる GRAMINFO -内に記述されている. -.Ip "deactivategram ID" -指定されたIDの認識文法を,一時的にOFFにする.OFFにされた文法は認識処理 -から一時的に除外される.このOFFにされた文法は Julius 内に保持され, -"activategram" コマンドで再び ON にできる. -.Ip "activategram ID" -一時的に OFF になっていた文法を再び ON にする. -.Ip "syncgram" -更新された文法を即時適応する. -.SH "COMMANDS (PROCESS)" -.Ip "listprocess" -現在エンジンにある認識プロセスの一覧を示す. -.Ip "currentprocess name" -コマンドを実行する対象のカレントプロセスを指定されたものに切替える. -.Ip "shiftprocess" -コマンドを実行する対象のカレントプロセスを順に切替える. -.Ip "addprocess jconffile" -エンジンに認識プロセスを追加する.jconffile は1つの LM 設定を含む -もので,サーバ側から見える必要が有る.追加された LM および認識プロセス -は jconffile の名前がプロセス名となる. 
-.Ip "delprocess name" -指定された名前の認識プロセスをエンジンから削除する. -.Ip "activateprocess name" -以前に一時無効化されたプロセスを再度有効化する. -.Ip "deactivateprocess name" -指定されたプロセスを一時無効化する. -.Ip "addword gram_id dictfile" -dictfile中の単語を,カレントプロセスの gram_id の文法に追加する. -(文法・単語認識のみ) -.SH "EXAMPLE" -Julius からのメッセージは "> " を行の先頭につけて -そのまま標準出力に出力されます. -出力内容の詳細については,関連文書を参照してください. -.PP -(1) Julius をモジュールモードでホスト host で起動する. - % julius -C xxx.jconf ... -input mic -module -.PP -(2) (他の端末で) jcontrol を起動し,通信を開始する. - % jcontrol host - connecting to host:10500...done - > - > # 0: [active] 99words, 42categories, 135nodes (new) - > - > - > # 0: [active] 99words, 42categories, 135 nodes - > Grobal: 99words, 42categories, 135nodes - > - > - -> pause - -> resume - > - -> addgram test - .... - -.SH "SEE ALSO" -julius(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH VERSION -This version is provided as part of Julius-3.5.1. -.SH COPYRIGHT -Copyright (c) 2002-2007 京都大学 河原研究室 -.br -Copyright (c) 2002-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2007 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:47 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:47 +0900 Subject: [Julius-cvs 285] CVS update: julius4/libjulius Message-ID: <1222935827.862235.32348.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/jconf.man diff -u julius4/libjulius/jconf.man:1.1 julius4/libjulius/jconf.man:removed --- julius4/libjulius/jconf.man:1.1 Tue Dec 18 23:09:23 2007 +++ julius4/libjulius/jconf.man Thu Oct 2 17:23:47 2008 @@ -1,1053 +0,0 @@ -.TH "jconf " "5 " -.SH NAME -jconf -\- Jconf configuration file specification -.SH DESCRIPTION -The variables that can be written in Jconf file are organized as follows. 
-.TP 0.2i -\(bu -Global options -.TP 0.2i -\(bu -Instance declaration -.TP 0.2i -\(bu -Language model instance -.TP 0.2i -\(bu -Acoustic model and speech analysis instance -.TP 0.2i -\(bu -Recognizer and search instance -.PP -The details are described in the followings. -.SH EXAMPLE -These are examples of jconf file. -.PP -First example is a simple one with no instance declaration. When -no instance declaration is found, Julius assumes there are only -one AM, LM and recognition process instance. In this case, the -default instance will be named "\fB_default\fR", and -option order does not matter. This is equivalent to older version -of Julius, except for GMM handling (see below). -.PP -\fBExample of Jconf file: no instance declaration\fR -.PP -.nf - - \-C jconffile - (\fIOther global options\fR...) - (\fIAM and analysis options\fR...) - (\fILM options\fR...) - (\fISearch options\fR...) - -.fi -.PP -This is an example using two acoustic models and three language -models of different types. Three recognition process instance is -defined for each combination of AM and LM. The LM type (ngram / -grammar / word) is determined by the arguments. The Global -options are placed at the top in the example, but actually it can -be placed anywhere in the file. -.PP -\fBExample of Jconf file: multi model decoding\fR -.PP -.nf - - \-C jconffile - (\fIOther global options\fR...) - \-AM am1 - (\fIAM and analysis options for am1\fR...) - \-AM am2 - (\fIAM and analysis options for am2\fR...) - \-LM lm_ngram - \-d ngram \-v dictfile - (\fILM options for lm1\fR...) - \-LM lm_grammar - \-gram grammarprefix - (\fILM options for lm2\fR...) - \-LM lm_word - \-w dictfile - (\fILM options for lm3\fR...) - \-SR recog_ngram am1 lm_ngram - (\fISearch options for recog_ngram\fR...) - \-SR recog_grammar am1 lm_grammar - (\fISearch options for recog_ngram\fR...) - \-SR recog_word am2 lm_word - (\fISearch options for recog_ngram\fR...) 
- -.fi -.PP -This is another example using GMM for frontend processing. Note -that from Rev.4.0 Julius has independent MFCC calculation scheme -for GMM. This means that you should explicitly specify the -acoustic analysis condition for GMM, not only the AM. -.PP -Option \fB\-AM_GMM\fR switch the current AM configuration -to the one prepared internally for GMM. You can place AM configuration -after the option to specify MFCC computation parameter for GMM. -If you define exactly the same condition as AM for recognition, -the same MFCC calculation instance will be shared among AM and GMM. -Else, each MFCC will be computed independently. -.PP -\fBExample with GMM\fR -.PP -.nf - - \-C jconffile - (\fIOther global options\fR...) - \-gmm gmmdefs \-gmmreject noise - \-AM_GMM - (\fIanalysis options for GMM\fR...) - \-AM am1 - (\fIAM and analysis options for am1\fR...) - \-LM lm_ngram - \-d ngram \-v dictfile - (\fILM options for lm1\fR...) - \-SR recog_ngram am1 lm_ngram - -.fi -.SH "JCONF VARIABLES" -The full list of options and variables that can be specified in jconf -file is listed below. -.SS "GLOBAL OPTIONS " -.RS -.SS "Misc. options" -.RE -.TP -\fB\-C \fR\fIjconffile\fR -Load a jconf file. The options written in the file are -expanded at the point. This option can be used within -other jconf file. -.TP -\fB\-version \fR -Print version information to standard error, and exit. -.TP -\fB\-setting \fR -Print engine setting information to standard error, and exit. -.TP -\fB\-quiet \fR -Output less log. For result, only the best word sequence will be -printed. -.TP -\fB\-debug \fR -(For debug) output enoumous internal message and debug -information to log. -.TP -\fB\-check \fR\fB{wchmm|trellis|triphone}\fR -For debug, enter interactive check mode. -.RS -.SS "Audio input" -.RE -.TP -\fB\-input \fR\fB{mic|rawfile|mfcfile|adinnet|stdin|netaudio} \fR -Choose speech input source. 'file' or 'rawfile' for waveform -file, 'htkparam' or 'mfcfile' for HTK parameter file. 
Users will -be prompted to enter the file name from stdin, or you can use -"\-filelist" option to specify list of files to process. - -\&'mic' is to get audio input from live microphone device, and -\&'adinnet' means receiving waveform data via tcpip network from -an adinnet client. 'netaudio' is from DatLink/NetAudio input, -and 'stdin' means data input from standard input. - -For waveform file input, only WAV (no -compression) and RAW (noheader, 16bit, -big endian) are supported by default. Other format can be read -when compiled with \fBlibsnd\fR library. To see -what format is actually supported, see the help message using -option "\-help". For stdin input, only WAV and RAW is -supported. (default: mfcfile) -.TP -\fB\-filelist \fR\fIfilename\fR -(With \-input rawfile|mfcfile) perform recognition on all files -listed in the file. The file should contain an input file -per line. Engine ends when all of the files are processed. -.TP -\fB\-notypecheck \fR -By default, Julius checks the input parameter type whether it -matches the AM or not. This option will disable the check and -use the input vector as is. -.TP -\fB\-48 \fR -Record input with 48kHz sampling, and down\-sample it to 16kHz -on\-the\-fly. This option is valid for 16kHz model only. The -down\-sampling routine was ported from sptk. -(Rev. 4.0) -.TP -\fB\-NA \fR\fIdevicename\fR -Host name for DatLink server input (\fB\-input netaudio\fR). -.TP -\fB\-adport \fR\fIport_number\fR -With \fB\-input adinnet\fR, specify adinnet port -number to listen. (default: 5530) -.TP -\fB\-nostrip \fR -Julius by default removes successive zero samples in input -speech data. This option inhibits this removal. -.TP -\fB\-zmean \fR, \fB\-nozmean \fR -This option enables/disables DC offset removal of input -waveform. Offset will be estimated from the whole input. For -microphone / network input, zero mean of the first 48000 -samples (3 seconds in 16kHz sampling) will be used for the -estimation. 
(default: disabled) - -This option uses static offset for the channel. See also -\fB\-zmeansource\fR for frame\-wise offset removal. -.RS -.SS "Speech segment detection by level and zero\-cross" -.RE -.TP -\fB\-cutsilence \fR, \fB\-nocutsilence \fR -Turn on / off the speech detection by level and zero\-cross. -Default is on for mic / adinnet input, off for files. -.TP -\fB\-lv \fR\fIthres\fR -Level threshold for speech input detection. Values should be -from 0 to 32767. -.TP -\fB\-zc \fR\fIthres\fR -Zero crossing threshold per second. Only waves over the level -threshold (\fB\-lv\fR) will be counted. (default: 60) -.TP -\fB\-headmargin \fR\fImsec\fR -Silence margin at the start of speech segment in -milliseconds. (default: 300) -.TP -\fB\-tailmargin \fR\fImsec\fR -Silence margin at the end of speech segment in milliseconds. -(default: 400) -.TP -\fB\-rejectshort \fR\fImsec\fR -Reject input shorter than specified milliseconds. Search will -be terminated and no result will be output. -.RS -.SS "Input rejection by average power" -.RE -.PP -This feature will be enabled by -\fB\-\-enable\-power\-reject\fR on compilation. Should be -used with Decoder VAD or GMM VAD. Valid for real\-time input only. -.TP -\fB\-powerthres \fR\fIthres\fR -Reject the inputted segment by its average energy. If the -average energy of the last recognized input is below the -threshold, Julius will reject the input. (Rev.4.0) - -This option is valid when -\fB\-\-enable\-power\-reject\fR is specified -at compilation time. -.RS -.SS "Gaussian mixture model" -.RE -.PP -GMM will be used for input rejection by accumurated score, or for -GMM\-based frontend VAD when \fB\-\-enable\-gmm\-vad\fR is specified. -.PP -NOTE: You should also set the proper MFCC parameters required for the -GMM, specifying the acoustic parameters described in AM section -\fB\-AM_GMM\fR. -.TP -\fB\-gmm \fR\fIhmmdefs_file\fR -GMM definition file in HTK format. 
If specified, GMM\-based -input verification will be performed concurrently with the 1st -pass, and you can reject the input according to the result as -specified by \fB\-gmmreject\fR. The GMM should be -defined as one\-state HMMs. -.TP -\fB\-gmmnum \fR\fInumber\fR -Number of Gaussian components to be computed per frame on GMM -calculation. Only the N\-best Gaussians will be computed for -rapid calculation. The default is 10 and specifying smaller -value will speed up GMM calculation, but too small value (1 or -2) may cause degradation of identification performance. -.TP -\fB\-gmmreject \fR\fIstring\fR -Comma\-separated list of GMM names to be rejected as invalid -input. When recognition, the log likelihoods of GMMs -accumulated for the entire input will be computed concurrently -with the 1st pass. If the GMM name of the maximum score is -within this string, the 2nd pass will not be executed and the -input will be rejected. -.TP -\fB\-gmmmargin \fR\fIframes\fR -Head margin for GMM\-based VAD in frames. (Rev.4.0) - -This option will be valid only if compiled with -\fB\-\-enable\-gmm\-vad\fR. -.RS -.SS "Decoding option" -.RE -.PP -Real\-time processing means concurrent processing of MFCC computation -1st pass decoding. By default, real\-time processing on the pass is on -for microphone / adinnet / netaudio input, and for others. -.TP -\fB\-realtime \fR, \fB\-norealtime \fR -Explicitly switch on / off real\-time (pipe\-line) processing on -the first pass. The default is off for file input, and on for -microphone, adinnet and NetAudio input. This option relates -to the way CMN and energy normalization is performed: if off, -they will be done using average features of whole input. If -on, MAP\-CMN and energy normalization to do rea\-time processing. -.SS "INSTANCE DECLARATION FOR MULTI DECODING " -The following arguments will create a new configuration set with -default parameters, and switch current set to it. 
Jconf parameters -specified after the option will be set into the current set. -.PP -To do multi\-model decoding, these argument should be specified at -the first of each model / search instances with different names. -Any options before the first instance definition will be IGNORED. -.PP -When no instance definition is found (as older version of Julius), -all the options are assigned to a default instance named "_default". -.PP -Please note that decoding with a single LM and multiple AMs is not -fully supported. For example, you may want to construct the -jconf file as following. - -.nf - - \-AM am_1 \-AM am_2 - \-LM lm (LM spec..) - \-SR search1 am_1 lm - \-SR search2 am_2 lm -.fi - -This type of model sharing is not supported yet, since some part -of LM processing depends on the assigned AM. Instead, you can -get the same result by defining the same LMs for each AM, like this: - -.nf - - \-AM am_1 \-AM am_2 - \-LM lm_1 (LM spec..) - \-LM lm_2 (same LM spec..) - \-SR search1 am_1 lm_1 - \-SR search2 am_2 lm_2 -.fi - -.TP -\fB\-AM \fR\fIname\fR -Create a new AM configuration set, and switch current to the -new one. You should give a unique name. (Rev.4.0) -.TP -\fB\-LM \fR\fIname\fR -Create a new LM configuration set, and switch current to the -new one. You should give a unique name. (Rev.4.0) -.TP -\fB\-SR \fR\fIname\fR \fIam_name\fR \fIlm_name\fR -Create a new search configuration set, and switch current to -the new one. The specified AM and LM will be assigned to it. -The \fIam_name\fR and -\fIlm_name\fR can be either name or ID -number. You should give a unique name. (Rev.4.0) -.TP -\fB\-AM_GMM \fR -A special command to switch AM configuration set for -specifying speech analysis parameters of GMM. The current AM -will be switched to the GMM specific one already reserved, so -be careful not to confuse with normal AM configurations. -(Rev.4.0) -.SS "LANGUAGE MODEL (\-LM) " -Only one type of LM can be specified for a LM configuration. 
-If you want to use multi model, you should define them one by one, -each as a new LM. -.RS -.SS N\-gram -.RE -.TP -\fB\-d \fR\fIbingram_file\fR -Use binary format N\-gram. An ARPA N\-gram file can be -converted to Julius binary format by -mkbingram. -.TP -\fB\-nlr \fR\fIarpa_ngram_file\fR -A forward, left\-to\-right N\-gram language model in standard -ARPA format. When both a forward N\-gram and backward N\-gram -are specified, Julius uses this forward 2\-gram for the 1st -pass, and the backward N\-gram for the 2nd pass. - -Since ARPA file often gets huge and requires a lot of time to -load, it may be better to convert the ARPA file to Julius -binary format by mkbingram. Note that if -both forward and backward N\-gram is used for recognition, they -together should be converted to a single binary. - -When only a forward N\-gram is specified by this option and no -backward N\-gram specified by \fB\-nrl\fR, Julius -performs recognition with only the forward N\-gram. The 1st -pass will use the 2\-gram entry in the given N\-gram, and -The 2nd pass will use the given N\-gram, with converting -forward probabilities to backward probabilities by Bayes rule. -(Rev.4.0) -.TP -\fB\-nrl \fR\fIarpa_ngram_file\fR -A backward, right\-to\-left N\-gram language model in standard -ARPA format. When both a forward N\-gram and backward N\-gram -are specified, Julius uses the forward 2\-gram for the 1st -pass, and this backward N\-gram for the 2nd pass. - -Since ARPA file often gets huge and requires a lot of time to -load, it may be better to convert the ARPA file to Julius -binary format by mkbingram. Note that if -both forward and backward N\-gram is used for recognition, they -together should be converted to a single binary. - -When only a backward N\-gram is specified by this option and no -forward N\-gram specified by \fB\-nlr\fR, Julius -performs recognition with only the backward N\-gram. 
The 1st -pass will use the forward 2\-gram probability computed from the -backward 2\-gram using Bayes rule. The 2nd pass fully use the -given backward N\-gram. (Rev.4.0) -.TP -\fB\-v \fR\fIdict_file\fR -Word dictionary file. -.TP -\fB\-silhead \fR\fIword_string\fR \fB\-siltail \fR\fIword_string\fR -Silence word defined in the dictionary, for silences at -the beginning of sentence and end of sentence. (default: -"", "") -.TP -\fB\-iwspword \fR -Add a word entry to the dictionary that should correspond to -inter\-word pauses. This may improve recognition accuracy in -some language model that has no explicit inter\-word pause -modeling. The word entry to be added can be changed by -\fB\-iwspentry\fR. -.TP -\fB\-iwspentry \fR\fIword_entry_string\fR -Specify the word entry that will be added by -\fB\-iwspword\fR. (default: " [sp] sp -sp") -.TP -\fB\-sepnum \fR\fInumber\fR -Number of high frequency words to be isolated from the lexicon -tree, to ease approximation error that may be caused by the -one\-best approximation on 1st pass. (default: 150) -.RS -.SS Grammar -.RE -.PP -Multiple grammars can be specified by using \fB\-gram\fR and -\fB\-gramlist\fR. When you specify grammars using these -options multiple times, all of them will be read at startup. Note -that this is unusual behavior from other options (in normal Julius -option, last one override previous ones). You can use -\fB\-nogram\fR to reset the already specified grammars at -that point. -.TP -\fB\-gram \fR\fBgramprefix1[,gramprefix2[,gramprefix3,...]] \fR -Comma\-separated list of grammars to be used. the argument -should be prefix of a grammar, i.e. if you have -\fBfoo.dfa\fR and -\fBfoo.dict\fR, you can specify them by single -argument \fBfoo\fR. Multiple grammars can be -specified at a time as a comma\-separated list. -.TP -\fB\-gramlist \fR\fIlist_file\fR -Specify a grammar list file that contains list of grammars to -be used. The list file should contain the prefixes of -grammars, each per line. 
A relative path in the list file -will be treated as relative to the list file, not the current -path or configuration file. -.TP -\fB\-dfa \fR\fIdfa_file\fR \fB\-v \fR\fIdict_file\fR -An old way of specifying grammar files separately. -.TP -\fB\-nogram \fR -Remove the current list of grammars already specified by -\fB\-gram\fR, \fB\-gramlist\fR, -\fB\-dfa\fR and \fB\-v\fR. -.RS -.SS "Isolated word" -.RE -.PP -Multiple dictionary can be specified by using \fB\-w\fR and -\fB\-wlist\fR. When you specify multiple times, all of them -will be read at startup. You can use \fB\-nogram\fR to -reset the already specified dictionaries at that point. -.TP -\fB\-w \fR\fIdict_file\fR -Word dictionary for isolated word recognition. File format -is the same as other LM. (Rev.4.0) -.TP -\fB\-wlist \fR\fIlist_file\fR -Specify a dictionary list file that contains list of -dictionaries to be used. The list file should contain the -file name of dictionaries, each per line. A relative path in -the list file will be treated as relative to the list file, -not the current path or configuration file. (Rev.4.0) -.TP -\fB\-nogram \fR -Remove the current list of dictionaries already specified by -\fB\-w\fR and \fB\-wlist\fR. -.TP -\fB\-wsil \fR\fIhead_sil_model_name\fR \fItail_sil_model_name\fR \fIsil_context_name\fR -On isolated word recognition, silence models will be appended -to the head and tail of each word at recognition. This option -specifies the silence models to be appended. -\fIsil_context_name\fR is the name of the -head sil model and tail sil model as a context of word head -phone and tail phone. For example, if you specify -\fB\-wsil silB silE sp\fR, a word with phone -sequence \fBb eh t\fR will be translated as -\fBsilB sp\-b+eh b\-eh+t eh\-t+sp silE\fR. -(Rev.4.0) -.RS -.SS "User\-defined LM" -.RE -.TP -\fB\-userlm \fR -Declare to use user LM defined in program. This option should be -specified if you use user\-defined LM function. 
(Rev.4.0) -.RS -.SS "Misc LM options" -.RE -.TP -\fB\-forcedict \fR -Ignore dictionary errors and force running. Words with errors -will be skipped at startup. -.SS "ACOUSTIC MODEL AND SPEECH ANALYSIS (\-AM) (\-AM_GMM) " -Acoustic analysis parameters are included in this section, since the -AM defines the required parameter. You can use different MFCC type -for each AM. For GMM, the same parameter should be specified after -\fB\-AM_GMM\fR -.PP -When using multiple AM, the values of \fB\-smpPeriod\fR, -\fB\-smpFreq\fR, \fB\-fsize\fR and -\fB\-fshift\fR should have the same value among all AMs. -.RS -.SS "acoustic HMM and parameters" -.RE -.TP -\fB\-h \fR\fIhmmdef_file\fR -Acoustic HMM definition file. File should be in HTK ascii -format, or Julius binary format. You can convert HTK ascii hmmdefs -to Julius binary format by mkbinhmm. -.TP -\fB\-hlist \fR\fIhmmlist_file\fR -HMMList file for phone mapping. This option is required when -using a triphone model. This file provides a mapping between -logical triphone names generated from the dictionary and defined -HMM names in hmmdefs. -.TP -\fB\-tmix \fR\fInumber\fR -Specify the number of top Gaussians to be calculated in a -mixture codebook. Small number will speed up the acoustic -computation namely in a tied\-mixture model, but AM accuracy may -get worse on too small value. (default: 2) -.TP -\fB\-spmodel \fR\fIname\fR -Specify an HMM name that corresponds to short\-pause model in -HMM. This option will affect various aspects in recognition: -short\-pause skipping process on grammar recognition, word\-end -short\-pause model insertion with \fB\-iwsp\fR on -N\-gram recognition, or short\-pause segmentation -(\fB\-spsegment\fR). (default: "sp") -.TP -\fB\-multipath \fR -Enable multi\-path mode. Multi\-path mode expand state -transition availability to allow model\-skipping, or multiple -output/input transitions in HMMs.
However, since defining -additional word begin / end node and perform extra transition -check on decoding, the beam width may be required to set larger -and recognition becomes a bit slower. - -By default (without this option), Julius automatically check -the transition type of specified HMMs, and enable the -multi\-path mode if required. You can force Julius to enable multi\-path -mode with this option. (rev.4.0) -.TP -\fB\-gprune \fR\fB{safe|heuristic|beam|none|default} \fR -Set Gaussian pruning algorithm to use. The default setting -will be set according to the model type and engine setting. -"default" will force accepting the default setting. Set this -to "none" to disable pruning and perform full -computation. "safe" guarantees the top N Gaussians to be -computed. "heuristic" and "beam" do more aggressive -computational cost reduction, but may result in small loss of -accuracy model (default: 'safe' (standard), 'beam' (fast) for -tied mixture model, 'none' for non tied\-mixture model). -.TP -\fB\-iwcd1 \fR\fB{max|avg|best number} \fR -Select method to approximate inter\-word triphone on the head -and tail of a word in the first pass. - -"max" will apply the maximum likelihood of the same context -triphones. "avg" will apply the average likelihood of the -same context triphones. "best number" will apply the average -of top N\-best likelihoods of the same context -triphone. - -Default is "best 3" for use with N\-gram, and "avg" for grammar -and word. When this AM is shared by LMs of both type, -latter one will be chosen. -.TP -\fB\-iwsppenalty \fR\fIfloat\fR -Short pause insertion penalty for appended short pauses by -\fB\-iwsp\fR. -.TP -\fB\-gshmm \fR\fIhmmdef_file\fR -If this option is specified, Julius performs Gaussian Mixture -Selection for efficient decoding. The hmmdefs should be a -monophone model generated from an ordinary monophone HMM -model, using mkgshmm.
-.TP -\fB\-gsnum \fR\fInumber\fR -On GMS, specify number of monophone state from top to -compute the detailed corresponding triphones. (default: 24) -.RS -.SS "Speech analysis parameters" -.RE -.TP -\fB\-smpPeriod \fR\fIperiod\fR -Set sampling frequency of input speech by its sampling period, -in unit of 100 nanoseconds. Sampling rate can also be -specified by \fB\-smpFreq\fR. Please note that the -input frequency should be the same as trained conditions of -acoustic model you use. (default: 625 = 16000Hz) - -This option corresponds to the HTK Option "SOURCERATE". -The same value can be given to this option. - -When using multiple AM, this value should be the same among all -AMs. -.TP -\fB\-smpFreq \fR\fIHz\fR -Set sampling frequency of input speech in Hz. Sampling rate -can also be specified using "\-smpPeriod". Please note that -this frequency should be the same as the trained conditions of -acoustic model you use. (default: 16000) - -When using multiple AM, this value should be the same among all -AMs. -.TP -\fB\-fsize \fR\fIsample_num\fR -Window size in number of samples. (default: 400) - -This option corresponds to the HTK Option "WINDOWSIZE", -but value should be in samples (HTK value / smpPeriod). - -When using multiple AM, this value should be the same among all -AMs. -.TP -\fB\-fshift \fR\fIsample_num\fR -Frame shift in number of samples. (default: 160) - -This option corresponds to the HTK Option "TARGETRATE", -but value should be in samples (HTK value / smpPeriod). - -When using multiple AM, this value should be the same among all -AMs. -.TP -\fB\-preemph \fR\fIfloat\fR -Pre\-emphasis coefficient. (default: 0.97) - -This option corresponds to the HTK Option "PREEMCOEF". -The same value can be given to this option. -.TP -\fB\-fbank \fR\fInum\fR -Number of filterbank channels. (default: 24) - -This option corresponds to the HTK Option "NUMCHANS". -The same value can be given to this option. -Be aware that the default value differs from HTK (22). 
-.TP -\fB\-ceplif \fR\fInum\fR -Cepstral liftering coefficient. (default: 22) - -This option corresponds to the HTK Option "CEPLIFTER". -The same value can be given to this option. -.TP -\fB\-rawe \fR, \fB\-norawe \fR -Enable/disable using raw energy before pre\-emphasis (default: disabled) - -This option corresponds to the HTK Option "RAWENERGY". -Be aware that the default value differs from HTK (enabled at HTK, -disabled at Julius). -.TP -\fB\-enormal \fR, \fB\-noenormal \fR -Enable/disable normalizing log energy. On live input, this -normalization will be approximated from the average of last -input. (default: disabled) - -This option corresponds to the HTK Option "ENORMALISE". -Be aware that the default value differs from HTK (enabled at HTK, -disabled at Julius). -.TP -\fB\-escale \fR\fIfloat_scale\fR -Scaling factor of log energy when normalizing log -energy. (default: 1.0) - -This option corresponds to the HTK Option "ESCALE". -Be aware that the default value differs from HTK (0.1). -.TP -\fB\-silfloor \fR\fIfloat\fR -Energy silence floor in dB when normalizing log energy. -(default: 50.0) - -This option corresponds to the HTK Option "SILFLOOR". -.TP -\fB\-delwin \fR\fIframe\fR -Delta window size in number of frames. (default: 2) - -This option corresponds to the HTK Option "DELTAWINDOW". -The same value can be given to this option. -.TP -\fB\-accwin \fR\fIframe\fR -Acceleration window size in number of frames. (default: 2) - -This option corresponds to the HTK Option "ACCWINDOW". -The same value can be given to this option. -.TP -\fB\-hifreq \fR\fIHz\fR -Enable band\-limiting for MFCC filterbank computation: set -upper frequency cut\-off. Value of \-1 will disable it. -(default: \-1) - -This option corresponds to the HTK Option "HIFREQ". -The same value can be given to this option. -.TP -\fB\-lofreq \fR\fIHz\fR -Enable band\-limiting for MFCC filterbank computation: set -lower frequency cut\-off. Value of \-1 will disable it. 
-(default: \-1) - -This option corresponds to the HTK Option "LOFREQ". -The same value can be given to this option. -.TP -\fB\-zmeanframe \fR, \fB\-nozmeanframe \fR -With speech input, this option enables/disables frame\-wise DC -offset removal. This corresponds to HTK configuration -ZMEANSOURCE. This cannot be used with "\-zmean". -(default: disabled) -.RS -.SS "Real\-time cepstral mean normalization" -.RE -.TP -\fB\-cmnload \fR\fIfile\fR -Load initial cepstral mean vector from file on startup. The -file should be one saved by \fB\-cmnsave\fR. -Loading an initial cepstral mean enables Julius to better -recognize the first utterance on a microphone / network input. -.TP -\fB\-cmnsave \fR\fIfile\fR -Save cepstral mean vector at each input. The parameters will -be saved to the file at each input end, so the output file -always keeps the last cepstral mean. If output file already -exists, it will be overridden. -.TP -\fB\-cmnupdate \fR\fB\-cmnnoupdate \fR -Control whether to update the cepstral mean at each input on -microphone / network input. Disabling this and specifying -\fB\-cmnload\fR will make engine to use the initial -cepstral mean permanently. -.TP -\fB\-cmnmapweight \fR\fIfloat\fR -Specify weight of initial cepstral mean for MAP\-CMN. Specify -larger value to retain the initial cepstral mean for a longer -period, and smaller value to rely more on the current input. -(default: 100.0) -.RS -.SS "Spectral subtraction" -.RE -.TP -\fB\-sscalc \fR -Perform spectral subtraction using head part of each file. -Valid only for raw speech file input. Conflict with -\fB\-ssload\fR. -.TP -\fB\-sscalclen \fR\fImsec\fR -With \fB\-sscalc\fR, specify the length of head part -silence in milliseconds. (default: 300) -.TP -\fB\-ssload \fR\fIfile\fR -Perform spectral subtraction for speech input using -pre\-estimated noise spectrum from file. The noise spectrum -should be computed beforehand by mkss. -Valid for all speech input. Conflict with -\fB\-sscalc\fR.
-.TP -\fB\-ssalpha \fR\fIfloat\fR -Alpha coefficient of spectral subtraction for -\-sscalc and \-ssload. -Noise will be subtracted stronger as this value gets larger, -but distortion of the resulting signal also becomes -remarkable. (default: 2.0) -.TP -\fB\-ssfloor \fR\fIfloat\fR -Flooring coefficient of spectral subtraction. The spectral -power that goes below zero after subtraction will be -substituted by the source signal with this coefficient -multiplied. (default: 0.5) -.RS -.SS "Misc AM options" -.RE -.TP -\fB\-htkconf \fR\fIfile\fR -Parse the given HTK Config file, and set corresponding -parameters to Julius. When using this option, the default -parameter values are switched from Julius defaults to HTK -defaults. -.SS "RECOGNIZER AND SEARCH (\-SR) " -Default values for beam width and LM weights will change according to -compile\-time setup of JuliusLib and model specification. Please see -the startup log for the actual values. -.RS -.SS "General parameters" -.RE -.TP -\fB\-inactive \fR -Start this recognition process instance with inactive state. (Rev.4.0) -.TP -\fB\-1pass \fR -Perform only the first pass. This mode is automatically set -at isolated word recognition. -.TP -\fB\-no_ccd \fR, \fB\-force_ccd \fR -Normally Julius determines whether the specified acoustic -model is a context\-dependent model from the model names, i.e., -whether the model names contain character \fB+\fR -and \fB\-\fR. You can explicitly specify by these -options to avoid mis\-detection. These options will override -automatic detection. -.TP -\fB\-cmalpha \fR\fIfloat\fR -Smoothing parameter for confidence scoring. (default: 0.05) -.TP -\fB\-iwsp \fR -(Multi\-path mode only) Enable inter\-word context\-free short -pause handling. This option appends a skippable short pause -model for every word end. The added model will be skipped on -inter\-word context handling. The HMM model to be appended can -be specified by \fB\-spmodel\fR.
-.TP -\fB\-transp \fR\fIfloat\fR -Additional insertion penalty for transparent words. (default: -0.0) -.TP -\fB\-demo \fR -Equivalent to \fB\-progout \-quiet\fR. -.RS -.SS "1st pass parameters" -.RE -.TP -\fB\-lmp \fR\fIweight\fR \fIpenalty\fR -(N\-gram) Language model weights and word insertion penalties -for the first pass. -.TP -\fB\-penalty1 \fR\fIpenalty\fR -(Grammar) word insertion penalty for the first pass. (default: 0.0) -.TP -\fB\-b \fR\fIwidth\fR -Beam width for rank beam in number of HMM nodes on the first -pass. This value defines search width on the 1st pass, and -has great effect on the total processing time. Smaller width -will speed up the decoding, but too small value will result in -a substantial increase of recognition errors due to search -failure. Larger value will make the search stable and will -lead to failure\-free search, but processing time and memory -usage will grow in proportion to the width. - -The default value is dependent on acoustic model type: 400 -(monophone), 800 (triphone), or 1000 (triphone, setup=v2.1) -.TP -\fB\-nlimit \fR\fInum\fR -Upper limit of token per node. This option is valid when -\fB\-\-enable\-wpair\fR and -\fB\-\-enable\-wpair\-nlimit\fR are enabled at -compilation time. -.TP -\fB\-progout \fR -Enable progressive output of the partial results on the first pass. -.TP -\fB\-proginterval \fR\fImsec\fR -Set the output time interval of \fB\-progout\fR in -milliseconds. -.RS -.SS "2nd pass parameters" -.RE -.TP -\fB\-lmp2 \fR\fIweight\fR \fIpenalty\fR -(N\-gram) Language model weights and word insertion penalties -for the second pass. -.TP -\fB\-penalty2 \fR\fIpenalty\fR -(Grammar) word insertion penalty for the second pass. (default: 0.0) -.TP -\fB\-b2 \fR\fIwidth\fR -Envelope beam width (number of hypothesis) in second pass. If -the count of word expansion at a certain length of hypothesis -reaches this limit while search, shorter hypotheses are not -expanded further.
This prevents search to fall in -breadth\-first\-like status stacking on the same position, and -improve search failure. (default: 30) -.TP -\fB\-sb \fR\fIfloat\fR -Score envelope width for enveloped scoring. When calculating -hypothesis score for each generated hypothesis, its trellis -expansion and viterbi operation will be pruned in the middle -of the speech if score on a frame goes under the width. -Giving small value makes the second pass faster, but -computation error may occur. (default: 80.0) -.TP -\fB\-s \fR\fInum\fR -Stack size, i.e. the maximum number of hypothesis that can be -stored on the stack during the search. A larger value may -give more stable results, but increases the amount of memory -required. (default: 500) -.TP -\fB\-m \fR\fIcount\fR -Number of expanded hypotheses required to discontinue the -search. If the number of expanded hypotheses is greater than -this threshold, the search is discontinued at that point. -The larger this value is, the longer Julius gets to give up -search. (default: 2000) -.TP -\fB\-n \fR\fInum\fR -The number of candidates Julius tries to find. The search -continues till this number of sentence hypotheses have been -found. The obtained sentence hypotheses are sorted by score, -and final result is displayed in the order (see also the -\fB\-output\fR). The possibility that the optimum -hypothesis is correctly found increases as this value gets -increased, but the processing time also becomes longer. The -default value depends on the engine setup on compilation time: -10 (standard) or 1 (fast or v2.1) -.TP -\fB\-output \fR\fInum\fR -The top N sentence hypothesis to be output at the end of -search. Use with \fB\-n\fR (default: 1) -.TP -\fB\-lookuprange \fR\fIframe\fR -When performing word expansion on the second pass, this option -sets the number of frames before and after to look up next -word hypotheses in the word trellis.
This prevents the -omission of short words, but with a large value, the number of -expanded hypotheses increases and system becomes -slow. (default: 5) -.TP -\fB\-looktrellis \fR -(Grammar) Expand only the words survived on the first pass -instead of expanding all the words predicted by grammar. This -option makes second pass decoding slightly faster especially -for large vocabulary condition, but may increase deletion -error of short words. (default: disabled) -.RS -.SS "Short\-pause segmentation" -.RE -.PP -When compiled with \fB\-\-enable\-decoder\-vad\fR, the -short\-pause segmentation will be extended to support decoder\-based -VAD. -.TP -\fB\-spsegment \fR -Enable short\-pause segmentation mode. Input will be segmented -when a short pause word (word with only silence model in -pronunciation) gets the highest likelihood at certain -successive frames on the first pass. When detected segment -end, Julius stop the 1st pass at the point, perform 2nd pass, -and continue with next segment. The word context will be considered -among segments. (Rev.4.0) - -When compiled with \fB\-\-enable\-decoder\-vad\fR, -this option enables decoder\-based VAD, to skip long silence. -.TP -\fB\-spdur \fR\fIframe\fR -Short pause duration length to detect end of input segment, in -number of frames. (default: 10) -.TP -\fB\-pausemodels \fR\fIstring\fR -A comma\-separated list of pause model names to be used at short\-pause -segmentation. The word with only the pause models will be treated -as "pause word" for pause detection. If not specified, name -of \fB\-spmodel\fR, \fB\-silhead\fR and -\fB\-siltail\fR will be used. (Rev.4.0) -.TP -\fB\-spmargin \fR\fIframe\fR -Backstep margin at trigger up for decoder\-based VAD. (Rev.4.0) - -This option will be valid only if compiled with -\fB\-\-enable\-decoder\-vad\fR. -.TP -\fB\-spdelay \fR\fIframe\fR -Trigger decision delay frame at trigger up for decoder\-based -VAD.
(Rev.4.0) - -This option will be valid only if compiled with -\fB\-\-enable\-decoder\-vad\fR. -.RS -.SS "Lattice / confusion network output" -.RE -.TP -\fB\-lattice \fR, \fB\-nolattice \fR -Enable / disable generation of word graph. Search -algorithm also has changed to optimize for better word graph -generation, so the sentence result may not be the same as -normal N\-best recognition. (Rev.4.0) -.TP -\fB\-confnet \fR, \fB\-noconfnet \fR -Enable / disable generation of confusion network. Enabling -this will also activate \fB\-lattice\fR internally. -(Rev.4.0) -.TP -\fB\-graphrange \fR\fIframe\fR -Merge same words at neighbor position at graph generation. If -the position of same words differs smaller than this value, -they will be merged. The default is 0 (allow merging on -exactly the same location) and specifying larger value will -result in smaller graph output. Setting to \-1 will disable -merging, in that case same words on the same location of -different scores will be left as they are. (default: 0) -.TP -\fB\-graphcut \fR\fIdepth\fR -Cut the resulting graph by its word depth at post\-processing -stage. The depth value is the number of words to be allowed -at a frame. Setting to \-1 disables this feature. (default: -80) -.TP -\fB\-graphboundloop \fR\fIcount\fR -Limit the number of boundary adjustment loop at -post\-processing stage. This parameter prevents Julius from -blocking by infinite adjustment loop by short word -oscillation. (default: 20) -.TP -\fB\-graphsearchdelay \fR, \fB\-nographsearchdelay \fR -When "\-graphsearchdelay" option is set, Julius modifies its -graph generation algorithm on the 2nd pass not to terminate -search by graph merging, until the first sentence candidate is -found. This option may improve graph accuracy, especially -when you are going to generate a huge word graph by setting -broad search.
Namely, it may result in better graph accuracy -when you set wide beams on both 1st pass \fB\-b\fR -and 2nd pass \fB\-b2\fR, and large number for -\fB\-n\fR. (default: disabled) -.RS -.SS "Multi\-gram / multi\-dic output" -.RE -.TP -\fB\-multigramout \fR, \fB\-nomultigramout \fR -On grammar recognition using multiple grammars, Julius will -output only the best result among all grammars. Enabling this -option will make Julius to output result for each grammar. -(default: disabled) -.RS -.SS "Forced alignment" -.RE -.TP -\fB\-walign \fR -Do viterbi alignment per word units for the recognition -result. The word boundary frames and the average acoustic -scores per frame will be calculated. -.TP -\fB\-palign \fR -Do viterbi alignment per phone units for the recognition -result. The phone boundary frames and the average acoustic -scores per frame will be calculated. -.TP -\fB\-salign \fR -Do viterbi alignment per state for the recognition result. -The state boundary frames and the average acoustic scores per -frame will be calculated. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:48 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:48 +0900 Subject: [Julius-cvs 286] CVS update: julius4/mkbingram Message-ID: <1222935828.860796.32452.nullmailer@users.sourceforge.jp> Index: julius4/mkbingram/00readme-ja.txt diff -u julius4/mkbingram/00readme-ja.txt:1.2 julius4/mkbingram/00readme-ja.txt:1.3 --- julius4/mkbingram/00readme-ja.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbingram/00readme-ja.txt Thu Oct 2 17:23:48 2008 @@ -1,90 +1,86 @@ -MKBINGRAM(1) MKBINGRAM(1) + mkbingram +MKBINGRAM(1) MKBINGRAM(1) -NAME - mkbingram - make binary N-gram from arpa N-gram file -SYNOPSIS - mkbingram -nlr forward_ngram.arpa -nrl backward_ngram.arpa bingram +?? + mkbingram + - ???? N-gram ?? + +?? 
+ mkbingram [-nlr forward_ngram.arpa] [-nrl backward_ngram.arpa] + [-d old_bingram_file] {output_bingram_file} DESCRIPTION - mkbingram ??ARPA?ョ????/??? N-gram ??????ョ?????? - ????????????????????????Julius??????? ? - ???????????? - - Rev.4.0 ???4-gram???-gram???????????????l? 10 - ??? - - ???N-gram? "-nlr" ?????????N-gram???? ? ? ? ??? - mkbingram ? ???N-gram????????N-gram???????????? - ?N-gram??????Julius ????? 2-gram ?????1???????2 - ? ????????????????????????????Z?????- ?ッ?????? - - ???N-gram? "-nrl" ?????????N-gram???? ? ? ? ??? - mkbingram?????N-gram????????N-gram???????????? - ?N-gram??????Julius ???????? 2-gram ??????????- ???????????ッ?????2??????? N-gram?????ッ? - ????? - - ???????????????N-gram??2-gram????N-gram???? ? - ?????N-gram????????Julius???????2-gram??1???? - ?????N-gram??2??????????? N-gram ?????????? - ? ??????????????????????????????C?? - ????????????????? - - mkbingram ? gzip ?????ARPA ???????????????? - - 4.0???Julius????mkbingram????????????N-gram??? ? - ?? 3.x??????????????????? + mkbingram ??ARPA?ョ? N-gram ???????Julius??????N-gram + ??????????????????????????????Julius?? + ????????????? + + Julius-4???N-gram ???????????????????????? + ???????mkbingram ????????????????N-gram???? + ?? ????????????????????C???2??N-gram??? + ?? ???N-gram???????? + + ???N-gram???????????mkbingram ? ???N-gram????? + ???N-gram?????????????N-gram??????Julius ??? + ?? 2-gram ?????1???????2 ? ?????????????? + ??????????????Z?????Fッ?????? + + ???N-gram???????????mkbingram?????N-gram????? + ???N-gram?????????????N-gram??????Julius ??? + ????? 2-gram ??????????Z??????????ッ???? + ?2??????? N-gram?????ッ?????? + + ???????????????N-gram??2-gram????N-gram????? + ?????N-gram????????Julius???????2-gram??1??? + ??????N-gram??2??????????? N-gram ???????? + ??? ??????????????????????????????C + ??????????????????? + + ???mkbingram ? gzip ?????ARPA ?????????????? + ?? + + ????? 3.x ???????????N-gram?????? 4.0 ????? + ??mkbingram ? -d ???????????????ョ ????????? 
+ ョ????????????????4.0 ??? mkbingram ???????? + ?N-gram?????3.x ?????????? ????????????? + ?? OPTIONS - -nlr forward_ngram.arpa - ARPA??`ョ?????? N-gram ????? - - -nrl backward_ngram.arpa - ARPA??`ョ?????? N-gram ????? - - -d ????N-gram - ?????????N-gram???????????N-gram?????? - - bingram - ??t????Julius??????ョ? + -nlr forward_ngram.arpa + ????left-to-right??ARPA?ョ N-gram ????????? -EXAMPLE - ARPA?ョ?N-gram??????ョ?????? + -nrl backward_ngram.arpa + ?????right-to-left??ARPA?ョ N-gram ????????? - % mkbingram -nlr ARPA_2gram -nrl ARPA_rev_3gram outfile + -d old_bingram_file + ????N-gram?????????????ョ????? - ??????N-gram?????3.5????ョ?????? - - % mkbingram -d old_bingram new_bingram - - -USAGE - Julius ????????????? ARPA ?ョ????? "-nlr 2gramfile - -nrl rev3gramfile" ??????? mkbingram ??????????ョ?? - ??? "-d bingramfile" ??????? + output_bingram_file + ????o???N-gram????? + +EXAMPLES + ARPA?ョ? N-gram ??????ョ?????????+?????? + ARPA?ョ???? 4-gram ??????ョ????????????? + ??????N-gram?????????ョ?????? SEE ALSO - julius(1) - -BUGS - ??????????????? ? ? ? julius-info at lists.source- - forge.jp ????????? + julius ( 1 ) , + mkbinhmm ( 1 ) COPYRIGHT - Copyright (c) 1991-2007 ???? ????コ - Copyright (c) 2000-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2007 ??????? Julius????? + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? 
LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL MKBINGRAM(1) + 10/02/2008 MKBINGRAM(1) Index: julius4/mkbingram/00readme.txt diff -u julius4/mkbingram/00readme.txt:1.2 julius4/mkbingram/00readme.txt:1.3 --- julius4/mkbingram/00readme.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbingram/00readme.txt Thu Oct 2 17:23:48 2008 @@ -1,89 +1,94 @@ + mkbingram + MKBINGRAM(1) MKBINGRAM(1) NAME - mkbingram - make binary N-gram from arpa N-gram file + mkbingram + - make binary N-gram from ARPA N-gram file SYNOPSIS - mkbingram -nlr forward_ngram.arpa -nrl backward_ngram.arpa bingram + mkbingram [-nlr forward_ngram.arpa] [-nrl backward_ngram.arpa] + [-d old_bingram_file] {output_bingram_file} DESCRIPTION - mkbingram makes a binary N-gram file for Julius from forward (left-to- - right) word N-gram and/or backward (right-to-left) word N-gram LMs in - ARPA standard format. Using the binary file, the initial startup of - Julius becomes much faster. - - From rev. 4.0, longer N-gram (N < 10) is supported. - - When only a forward N-gram is specified by "-nlr" and no backward N- - gram is specified, mkbingram generates binary N-gram for recognition - with only the forward N-gram. The 1st pass will use the 2-gram entry - in the given N-gram, and The 2nd pass will use the given N-gram, with - converting forward probabilities to backward probabilities by Bayes + mkbingram is a tool to convert N-gram definition file(s) in ARPA + standard format to a compact Julius binary format. It will speed up the + initial loading time of N-gram much faster. It can read gzipped file + directly. + + From rev.4.0, Julius can deal with forward N-gram, backward N-gram and + their combinations. So, mkbingram now generates binary N-gram file from + one of them, or combining them two to produce one binary N-gram. + + When only a forward N-gram is specified, mkbingram generates binary + N-gram from only the forward N-gram. 
When using this binary N-gram at + Julius, it performs the 1st pass with the 2-gram probabilities in the + N-gram, and run the 2nd pass with the given N-gram fully, with + converting forward probabilities to backward probabilities by Bayes rule. - When only a backward N-gram is specified by "-nrl" and no forward N- - gram is specified, mkbingram generates binary N-gram for recognition - with only the backward N-gram. The 1st pass will use the forward - 2-gram probability computed from the backward 2-gram using Bayes rule. - The 2nd pass fully use the given backward N-gram. - - When both forward and backward N-grams are specified, forward 2-gram - part and backward N-gram are gathered together into single bingram - file, to use the forward 2-gram for the 1st pass and backward N-gram - for the 2nd pass. Note that both N-gram should be trained in the same - corpus with same parameters (i.e. cut-off thresholds), with same vocab- - ulary. - - mkbingram can read gzipped ARPA file. + When only a backward N-gram is specified, mkbingram generates an binary + N-gram file that contains only the backward N-gram. The 1st pass will + use forward 2-gram probabilities that can be computed from the backward + 2-gram using Bayes rule, and the 2nd pass use the given backward N-gram + fully. + + When both forward and backward N-grams are specified, the 2-gram part + in the forward N-gram and all backward N-gram will be combined into + single bingram file. The forward 2-gram will be applied for the 1st + pass and backward N-gram for the 2nd pass. Note that both N-gram should + be trained in the same corpus with same parameters (i.e. cut-off + thresholds), with same vocabulary. + + The old binary N-gram produced by mkbingram of version 3.x and earlier + can be used in Julius-4, but you can convert the old version to the new + version by specifying it as input of current mkbingram by option "-d". 
- Please note that binary N-gram file converted by mkbingram of version - 4.0 and later cannot be read by Julius 3.x. + Please note that binary N-gram file converted by mkbingram of version + 4.0 and later cannot be read by older Julius 3.x. OPTIONS - -nlr forward_ngram.arpa - Forward (left-to-right) word N-gram file in ARPA standard for- - mat. - - -nrl backward_ngram.arpa - Backward (right-to-left) word N-gram file in ARPA standard for- - mat. - - -d old_bingram - Read in an old binary N-gram file (for conversion to the new - format). - - bingram - output binary N-gram file. - -EXAMPLE - Convert ARPA files to binary format: - - % mkbingram -nlr ARPA_2gram -nrl ARPA_rev_3gram outfile - - Convert old binary N-gram file to new format: - - % mkbingram -d old_bingram new_bingram - + -nlr forward_ngram.arpa + Read in a forward (left-to-right) word N-gram file in ARPA standard + format. + + -nrl backward_ngram.arpa + Read in a backward (right-to-left) word N-gram file in ARPA standard + format. + + -d old_bingram_file + Read in a binary N-gram file. + + output_bingram_file + binary N-gram file name to output. 
+ +EXAMPLES + Convert a set of forward and backward N-gram in ARPA format into Julius + binary form: + Convert a single forward 4-gram in ARPA format into a binary file: + Convert old binary N-gram file to current format: SEE ALSO - julius(1) + julius ( 1 ) , + mkbinhmm ( 1 ) , + mkbinhmmlist ( 1 ) COPYRIGHT - Copyright (c) 1991-2007 Kawahara Lab., Kyoto University - Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL MKBINGRAM(1) + 10/02/2008 MKBINGRAM(1) Index: julius4/mkbingram/mkbingram.man diff -u julius4/mkbingram/mkbingram.man:1.2 julius4/mkbingram/mkbingram.man:removed --- julius4/mkbingram/mkbingram.man:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbingram/mkbingram.man Thu Oct 2 17:23:48 2008 @@ -1,83 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKBINGRAM 1 LOCAL -.UC 6 -.SH NAME -mkbingram - make binary N-gram from arpa N-gram file -.SH SYNOPSIS -.B mkbingram -nlr forward_ngram.arpa -nrl backward_ngram.arpa bingram -.SH DESCRIPTION -.I mkbingram -makes a binary N-gram file for Julius from forward (left-to-right) -word N-gram and/or backward (right-to-left) word N-gram LMs in ARPA -standard format. Using the binary file, the initial startup of Julius -becomes much faster. -.PP -From rev. 4.0, longer N-gram (N < 10) is supported. 
-.PP -When only a forward N-gram is specified by "-nlr" and no backward -N-gram is specified, mkbingram generates binary N-gram for recognition -with only the forward N-gram. The 1st pass will use the 2-gram entry -in the given N-gram, and The 2nd pass will use the given N-gram, with -converting forward probabilities to backward probabilities by Bayes -rule. -.PP -When only a backward N-gram is specified by "-nrl" and no forward -N-gram is specified, mkbingram generates binary N-gram for recognition -with only the backward N-gram. The 1st pass will use the forward -2-gram probability computed from the backward 2-gram using Bayes rule. -The 2nd pass fully use the given backward N-gram. -.PP -When both forward and backward N-grams are specified, forward 2-gram -part and backward N-gram are gathered together into single bingram -file, to use the forward 2-gram for the 1st pass and backward N-gram -for the 2nd pass. Note that both N-gram should be trained in the same -corpus with same parameters (i.e. cut-off thresholds), with same -vocabulary. -.PP -.I mkbingram -can read gzipped ARPA file. -.PP -Please note that binary N-gram file converted by mkbingram of version -4.0 and later cannot be read by Julius 3.x. -.SH OPTIONS -.Ip "-nlr forward_ngram.arpa" -Forward (left-to-right) word N-gram file in ARPA standard format. -.Ip "-nrl backward_ngram.arpa" -Backward (right-to-left) word N-gram file in ARPA standard format. -.Ip "-d old_bingram" -Read in an old binary N-gram file (for conversion to the new format). -.Ip "bingram" -output binary N-gram file. 
-.SH EXAMPLE -Convert ARPA files to binary format: -.PP - % mkbingram -nlr ARPA_2gram -nrl ARPA_rev_3gram outfile -.PP -Convert old binary N-gram file to new format: -.PP - % mkbingram -d old_bingram new_bingram - -.SH "SEE ALSO" -julius(1) -.SH COPYRIGHT -Copyright (c) 1991-2007 Kawahara Lab., Kyoto University -.br -Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/mkbingram/mkbingram.man.ja diff -u julius4/mkbingram/mkbingram.man.ja:1.2 julius4/mkbingram/mkbingram.man.ja:removed --- julius4/mkbingram/mkbingram.man.ja:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbingram/mkbingram.man.ja Thu Oct 2 17:23:48 2008 @@ -1,86 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKBINGRAM 1 LOCAL -.UC 6 -.SH NAME -mkbingram - make binary N-gram from arpa N-gram file -.SH SYNOPSIS -.B mkbingram -nlr forward_ngram.arpa -nrl backward_ngram.arpa bingram -.SH DESCRIPTION -.I mkbingram -は,ARPA形式の前向き/後向き N-gram をバイナリ形式のファイルに結合・変 -換するツールです.これを使用することで,Juliusの起動を大幅に高速化する -ことができます. -.PP -Rev.4.0 からは4-gram以上のN-gramも扱えるようになりました.上限値は 10 -です. -.PP -前向きN-gramが "-nlr" で指定され,後向きN-gramが指定されない場合, -mkbingramは前向きN-gramだけからバイナリN-gramを生成します.この -バイナリN-gramを使うとき,Julius はその中の 2-gram を使って第1パスを -行い,第2パスではその前向き確率から後向きの確率を,ベイズ則に従って -算出しながら認識を行います. -.PP -後向きN-gramが "-nrl" で指定され,前向きN-gramが指定されない場合, -mkbingramは後ろ向きN-gramだけからバイナリN-gramを生成します.このバイ -ナリN-gramを使うとき,Julius はその中の後向き 2-gram からベイズ則に従っ -て算出しながら第1パスの認識を行い,第2パスでは後向き N-gramを使った -認識を行います. -.PP -両方が指定されたときは,前向きN-gram中の2-gramと後向きN-gramが統合され -たバイナリN-gramが生成されます.Juliusではその前向き2-gramで第1パスを -行い,後向きN-gramで第2パスを行います.なお両 N-gram は同一のコーパス -から同一の条件(カットオフ値,バックオフ計算方法等)で学習されてあり, -同一の語彙を持っている必要があります. 
-.PP -.I mkbingram -は gzip 圧縮された ARPA ファイルをそのまま読み込めます. -.PP -4.0以降のJuliusに付属のmkbingramを使って変換したバイナリN-gramファイルは, -3.xでは読み込めませんのでご注意ください. -.SH OPTIONS -.Ip "-nlr forward_ngram.arpa" -ARPA標準形式の前向き単語 N-gram ファイル. -.Ip "-nrl backward_ngram.arpa" -ARPA標準形式の逆向き単語 N-gram ファイル. -.Ip "-d バイナリN-gram" -入力とするバイナリN-gramファイル(古いバイナリN-gramの再変換用) -.Ip "bingram" -出力ファイル(Julius用バイナリ形式) -.SH EXAMPLE -ARPA形式のN-gramをバイナリ形式に変換する: -.PP - % mkbingram -nlr ARPA_2gram -nrl ARPA_rev_3gram outfile -.PP -古いバイナリN-gramファイルを3.5以降の形式に変換する: -.PP - % mkbingram -d old_bingram new_bingram - -.SH USAGE -Julius で言語モデル指定時に,元の ARPA 形式ファイルを "-nlr 2gramfile --nrl rev3gramfile" とする代わりに mkbingram で変換したバイナリ形式ファ -イルを "-d bingramfile" と指定します. -.SH "SEE ALSO" -julius(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH COPYRIGHT -Copyright (c) 1991-2007 京都大学 河原研究室 -.br -Copyright (c) 2000-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2007 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:49 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:49 +0900 Subject: [Julius-cvs 287] CVS update: julius4/mkbinhmm Message-ID: <1222935829.084726.32465.nullmailer@users.sourceforge.jp> Index: julius4/mkbinhmm/00readme-ja.txt diff -u julius4/mkbinhmm/00readme-ja.txt:1.2 julius4/mkbinhmm/00readme-ja.txt:1.3 --- julius4/mkbinhmm/00readme-ja.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbinhmm/00readme-ja.txt Thu Oct 2 17:23:48 2008 @@ -1,64 +1,66 @@ + mkbinhmm + MKBINHMM(1) MKBINHMM(1) -NAME - mkbinhmm - convert HMM definition file to binary format for Julius +?? + mkbinhmm + - ???? HMM ?? -SYNOPSIS - mkbinhmm [-C HTK_Config] hmmdefs_file binhmm_file +?? + mkbinhmm [-htkconf HTKConfigFile] {hmmdefs_file} {binhmm_file} DESCRIPTION - mkbinhmm ??HTK?ョ??????ョ?HMM???????Julius?????? - ?ョ??????????????ョ?HMM????????????? ? ? - ?? Julius???????????????? 
+ mkbinhmm ??HTK??????ョ?HMM????????Julius????? ? + ?ョ??????????????? Julius??????????????? + ?? + + ????????????????t????????????????? + ??????????????????o???? HTK Config ????? + "-htkconf" ??????????????????????? ?ッ??ゥ + ??????????p??????????????????? + + ??????HTK?????ョ????????????Julius?????HMM + ????????????-htkconf ??????? ???????HMM??? + ?????????????????????? mkbinhmm ? gzip ?????MM?????????????????? - ????HMM???p???????????????? HTK Config ???? - ? "-C" ???? "-htkconf" ?????????????????????- ??t????????????????Julius ????????????? - ???????????????ゥ???????????????????- ? ????????????????????g??????????Julius - ?ゥ???????????????? - - ??????????ョ??????HMM?????????????? ? ? - ???????????HMM?????????????????????? - ?????????????????????? Config ???????? ? - ??????C??????o?????? - OPTIONS - -C ConfigFile - ????????o?????HTK Config????????????? - ????C??????t??????????????? - - -htkconf ConfigFile - "-C" ???? - -USAGE - ?????ョHMM??????Julius??????Julius ???????? ? - ?? ?? ASCII?ョ?????????????????????????? - ascii/binary ??ョ?Julius?ゥ???????????????????? - ????Julius ?????????Z????? + -htkconf HTKConfigFile + ????????o?????HTK Config????????????? ? + ???C??????????t??????????????? ??? + ????????????????D + + hmmdefs_file + ??????????????? (MMF)?HTK ASCII ?ョ????? + Julius ?????ョ? + + hmmdefs_file + Julius??????ョ????????D + +EXAMPLES + HTK ASCII ?ョ? HMM ????????ョ?????? + HTK??????? Config ?????????????o?? + ???????ョ????????????????F SEE ALSO - julius(1) - -BUGS - ? ? ? ?? ? ? ??????????? julius-info at lists.source- - forge.jp ????????? + julius ( 1 ) , + mkbingram ( 1 ) COPYRIGHT - Copyright (c) 2003-2006 ???? ????コ - Copyright (c) 2003-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2006 ??????? Julius????? + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? 
LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL MKBINHMM(1) + 10/02/2008 MKBINHMM(1) Index: julius4/mkbinhmm/00readme.txt diff -u julius4/mkbinhmm/00readme.txt:1.2 julius4/mkbinhmm/00readme.txt:1.3 --- julius4/mkbinhmm/00readme.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkbinhmm/00readme.txt Thu Oct 2 17:23:48 2008 @@ -1,66 +1,78 @@ + mkbinhmm + MKBINHMM(1) MKBINHMM(1) NAME - mkbinhmm - convert HMM definition file to binary format for Julius + mkbinhmm + - convert HMM definition file in HTK ascii format to Julius binary + format SYNOPSIS - mkbinhmm [-C HTK_Config] hmmdefs_file binhmm_file + mkbinhmm [-htkconf HTKConfigFile] {hmmdefs_file} {binhmm_file} DESCRIPTION - mkbinhmm convert an ascii hmmdefs in HTK format to a binary HMM defini- - tion file for Julius. + mkbinhmm converts an HMM definition file in HTK ascii format into a + binary HMM file for Julius. It will greatly speed up the launch + process. + + You can also embed acoustic analysis condition parameters needed for + recognition into the output file. To embed the parameters, specify the + HTK Config file you have used to extract acoustic features for training + the HMM by the option "-htkconf". + + The embedded parameters in a binary HMM format will be loaded into + Julius automatically, so you do not need to specify the acoustic + feature options at run time. It will be convenient when you deliver an + acoustic model. + + You can also specify a binary file as the input. This can be used to + update the old binary format into the new one, or to embed the config + parameters into the already existing binary files. If the input binhmm + already has acoustic analysis parameters embedded, they will be + overridden by the specified values. - mkbinhmm can read gzipped hmmdefs file. - By specifying the HTK Config file you used for training, you can embed - the acoustic analysis conditions and variables used for the training - into the output file.
You can specify the Config file by either "-C" - or "-htkconf". The vaules in the Config file will be converted to - Julius specifications and embedded to the output file. At run time, - the values will be loaded into Julius and appropriate acoustic analysis - parameters for the model will be automatically set. This will greatly - help ensuring the same acoustic conditions to be applied at both train- - ing and application time for waveform recognition. - - You can also specify a binary HMM as input file. This is for only - embedding Config parameters into the already existing binary files. If - the input binhmm already has acoustic analysis parameters embedded, - they will be overridden by the specified HTK Config values. + mkbinhmm can read a gzipped file as input. OPTIONS - -C ConfigFile - HTK Config file you used at training time. If specified, the - values are embedded to the output file. - - -htkconf ConfigFile - Same as "-C". - -USAGE - At Julius, this binary hmmdefs can be used in the same way as the orig- - inal ascii format, i.e. "-h". The ascii/binary format will be automat- - icall detected by Julius. If Config parameters are embedded, the val- - ues are loaded into Julius and acoustic analysis parameters will be set - to the values. + -htkconf HTKConfigFile + HTK Config file you used at training time. If specified, the values + are embedded to the output file. + + hmmdefs_file + The source HMM definition file in HTK ascii format or Julius binary + format. + + binhmm_file + Output file.
+ +EXAMPLES + Convert HTK ascii format HMM definition file into Julius binary file: + Furthermore, embed acoustic feature parameters as specified by Config + file + Embed the acoustic parameters into an existing binary file SEE ALSO - julius(1) + julius ( 1 ) , + mkbingram ( 1 ) , + mkbinhmmlist ( 1 ) COPYRIGHT - Copyright (c) 2003-2006 Kawahara Lab., Kyoto University - Copyright (c) 2003-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL MKBINHMM(1) + 10/02/2008 MKBINHMM(1) Index: julius4/mkbinhmm/mkbinhmm.man diff -u julius4/mkbinhmm/mkbinhmm.man:1.1.1.1 julius4/mkbinhmm/mkbinhmm.man:removed --- julius4/mkbinhmm/mkbinhmm.man:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkbinhmm/mkbinhmm.man Thu Oct 2 17:23:49 2008 @@ -1,66 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKBINHMM 1 LOCAL -.UC 6 -.SH NAME -mkbinhmm - convert HMM definition file to binary format for Julius -.SH SYNOPSIS -.B mkbinhmm [-C HTK_Config] hmmdefs_file binhmm_file -.SH DESCRIPTION -.I mkbinhmm -convert an ascii hmmdefs in HTK format to a binary HMM definition -file for Julius. -.PP -.I mkbinhmm -can read gzipped hmmdefs file. -.PP -By specifying the HTK Config file you used for training, you can embed -the acoustic analysis conditions and variables used for the training -into the output file. You can specify the Config file by either "-C" -or "-htkconf". 
The vaules in the Config file will be converted to -Julius specifications and embedded to the output file. At run time, -the values will be loaded into Julius and appropriate acoustic -analysis parameters for the model will be automatically set. -This will greatly help ensuring the same acoustic conditions to be -applied at both training and application time for waveform -recognition. -.PP -You can also specify a binary HMM as input file. This is for -only embedding Config parameters into the already existing binary -files. If the input binhmm already has acoustic analysis parameters -embedded, they will be overridden by the specified HTK Config values. -.SH OPTIONS -.Ip "-C ConfigFile" -HTK Config file you used at training time. If specified, the values -are embedded to the output file. -.Ip "-htkconf ConfigFile" -Same as "-C". -.SH USAGE -At Julius, this binary hmmdefs can be used in the same way as the -original ascii format, i.e. "-h". The ascii/binary format will be -automaticall detected by Julius. If Config parameters are embedded, -the values are loaded into Julius and acoustic analysis parameters -will be set to the values. -.SH "SEE ALSO" -julius(1) -.SH COPYRIGHT -Copyright (c) 2003-2006 Kawahara Lab., Kyoto University -.br -Copyright (c) 2003-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/mkbinhmm/mkbinhmm.man.ja diff -u julius4/mkbinhmm/mkbinhmm.man.ja:1.1.1.1 julius4/mkbinhmm/mkbinhmm.man.ja:removed --- julius4/mkbinhmm/mkbinhmm.man.ja:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkbinhmm/mkbinhmm.man.ja Thu Oct 2 17:23:49 2008 @@ -1,64 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. 
-.TH MKBINHMM 1 LOCAL -.UC 6 -.SH NAME -mkbinhmm - convert HMM definition file to binary format for Julius -.SH SYNOPSIS -.B mkbinhmm [-C HTK_Config] hmmdefs_file binhmm_file -.SH DESCRIPTION -.I mkbinhmm -は,HTK形式のアスキー形式のHMM定義ファイルをJulius用のバイナリ形式へ変 -換する.これのバイナリ形式のHMM定義ファイルを使用することにより, -Juliusの起動を高速化することができる. -.PP -.I mkbinhmm -は gzip 圧縮されたHMM定義ファイルをそのまま読み込めます. -.PP -変換時にHMMの学習用パラメータファイルの生成に用いた HTK Config ファイ -ルを "-C" あるいは "-htkconf" で指定することで,その音響特徴量抽出条件 -を出力ファイルに埋め込むこと -ができます.Julius は埋め込まれたパラメータを見つけると,その値を -読み込んで自動的に音声データからの音響特徴量条件として用います.これに -よって,モデル学習時に使用した特徴量の設定をJuliusで自動的にセットする -ことができます. -.PP -入力としてバイナリ形式に変換済みのHMMを指定することもできます.これを -使って,既存のバイナリHMMに特徴量抽出条件パラメータを埋め込むことがで -きます.入力に既にパラメータが埋め込まれてかつ Config ファイルが指定さ -れている場合は,上書きされて出力されます. -.SH OPTIONS -.Ip "-C ConfigFile" -学習時に特徴量抽出に使用したHTK Configファイルを指定する.指定された場 -合,その値が出力ファイルのヘッダに埋め込まれる. -.Ip "-htkconf ConfigFile" -"-C" と同じ. -.SH USAGE -バイナリ形式HMM定義モデルをJuliusで使うには,Julius で音響モデル指定時 -に,元の ASCII形式ファイルの代わりにこのファイルを指定するだけでよい. -ascii/binary の形式はJuliusで自動判別される.パラメータが埋め込まれて -いる場合は Julius がそれを読み出してセットする. -.SH "SEE ALSO" -julius(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH COPYRIGHT -Copyright (c) 2003-2006 京都大学 河原研究室 -.br -Copyright (c) 2003-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2006 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. 
From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:49 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:49 +0900 Subject: [Julius-cvs 288] CVS update: julius4/mkgshmm Message-ID: <1222935829.317582.32479.nullmailer@users.sourceforge.jp> Index: julius4/mkgshmm/00readme-ja.txt diff -u julius4/mkgshmm/00readme-ja.txt:1.2 julius4/mkgshmm/00readme-ja.txt:1.3 --- julius4/mkgshmm/00readme-ja.txt:1.2 Tue Dec 18 23:08:22 2007 +++ julius4/mkgshmm/00readme-ja.txt Thu Oct 2 17:23:49 2008 @@ -1,60 +1,51 @@ -MKGSHMM(1) MKGSHMM(1) + mkgshmm +MKGSHMM(1) MKGSHMM(1) -NAME - mkgshmm - convert monophone HMM to GS HMM for Julius -SYNOPSIS - mkgshmm monophone_hmmdefs > outputfile +?? + mkgshmm + - ?????HMM? GMS ?????? + +?? + mkgshmm {monophone_hmmdefs} + > + {outputfile} DESCRIPTION mkgshmm ?HTK?ョ?monophone HMM? Julius ? Gaussian Mixture Selection (GMS) ??????perl???????? - GMS?Julius-3.2???????????????????????? ?? ? - ?? ???? monophone ????x?????triphone?PTM????\?? - ?????????????????30%???????? - - -EXAMPLE - ??????????triphone?PTM????????????????mono- - phone ?????????? - - ????monophone???? mkgshmm ???? GMS ????????タ??? - ???`??????????????? - - % mkgshmm monophone > gshmmfile + GMS?Julius-3.2?????????????????????????? ? + ?????? monophone ????x?????triphone?PTM????\ ?? + ?????????????????????? + +EXAMPLES + ??????????triphone?PTM????????????????+ monophone ?????????? + ????monophone???? mkgshmm ???? GMS ???????? ??? Julius ? "-gshmm" ??????? - - % julius -C foo.jconf -gshmm gshmmfile - - ???GMS?????triphone?PTM?????????????????? ? - ? ??????????gshmm ????????????????????? - ???? + GMS?????triphone?PTM?????????????????????? + ????????gshmm ??????????????????????? + ?? SEE ALSO - julius(1) + julius ( 1 ) -BUGS - ??????????????? ? ? ? julius-info at lists.source- - forge.jp ????????? +COPYRIGHT + Copyright (c) 1991-2008 ???? ????コ -VERSION - This version is provided as part of Julius-3.5.1. 
+ Copyright (c) 1997-2000 ????U?????(IPA) -COPYRIGHT - Copyright (c) 2001-2005 ???? ????コ - Copyright (c) 2001-2005 ?????????w??? ュ???コ - Copyright (c) 2005 ??????? Julius????? + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL MKGSHMM(1) + 10/02/2008 MKGSHMM(1) Index: julius4/mkgshmm/00readme.txt diff -u julius4/mkgshmm/00readme.txt:1.1.1.1 julius4/mkgshmm/00readme.txt:1.2 --- julius4/mkgshmm/00readme.txt:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkgshmm/00readme.txt Thu Oct 2 17:23:49 2008 @@ -1,56 +1,50 @@ + mkgshmm + MKGSHMM(1) MKGSHMM(1) NAME - mkgshmm - convert monophone HMM to GS HMM for Julius + mkgshmm + - convert monophone HMM to GS HMM for Julius SYNOPSIS - mkgshmm monophone_hmmdefs > outputfile + mkgshmm {monophone_hmmdefs} + > + {outputfile} DESCRIPTION - mkgshmm converts monophone HMM definition file (hmmdefs) in HTK format - to a special format for Gaussian Mixture Selection (GMS) in Julius. + mkgshmm converts monophone HMM definition file in HTK format into a + special format for Gaussian Mixture Selection (GMS) in Julius. - GMS is an algorithm to reduce the amount of acoustic computation with - triphone HMM, by pre-selection of promising gaussian mixtures using + GMS is an algorithm to reduce the amount of acoustic computation with + triphone HMM, by pre-selection of promising gaussian mixtures using likelihoods of corresponding monophone mixtures. - For more details, please consult related documents and papers - -EXAMPLE - (1) Prepare a monophone model which was trained by the same corpus as +EXAMPLES + (1) Prepare a monophone model which was trained by the same corpus as target triphone model. (2) Convert the monophone model using mkgshmm. 
- - % mkgshmm monophone > gshmmfile - (3) Specify the output file in Julius with option "-gshmm" - % julius -C foo.jconf -gshmm gshmmfile - - SEE ALSO - julius(1) - -VERSION - This version is provided as part of Julius-3.5.1. + julius ( 1 ) COPYRIGHT - Copyright (c) 2001-2005 Kawahara Lab., Kyoto University - Copyright (c) 2001-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL MKGSHMM(1) + 10/02/2008 MKGSHMM(1) Index: julius4/mkgshmm/mkgshmm.man diff -u julius4/mkgshmm/mkgshmm.man:1.1.1.1 julius4/mkgshmm/mkgshmm.man:removed --- julius4/mkgshmm/mkgshmm.man:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkgshmm/mkgshmm.man Thu Oct 2 17:23:49 2008 @@ -1,58 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKGSHMM 1 LOCAL -.UC 6 -.SH NAME -mkgshmm - convert monophone HMM to GS HMM for Julius -.SH SYNOPSIS -.B mkgshmm monophone_hmmdefs > outputfile -.SH DESCRIPTION -.I mkgshmm -converts monophone HMM definition file (hmmdefs) in HTK format to -a special format for Gaussian Mixture Selection (GMS) in -.I Julius. -.PP -GMS is an algorithm to reduce the amount of acoustic computation with -triphone HMM, by pre-selection of promising gaussian mixtures using -likelihoods of corresponding monophone mixtures. 
-.PP -For more details, please consult related documents and papers -.SH EXAMPLE -.PP -(1) Prepare a monophone model which was trained by the same corpus as -target triphone model. -.PP -(2) Convert the monophone model using -.I mkgshmm. -.PP - % mkgshmm monophone > gshmmfile -.PP -(3) Specify the output file in Julius with option "-gshmm" -.PP - % julius -C foo.jconf -gshmm gshmmfile -.PP -.SH "SEE ALSO" -julius(1) -.SH VERSION -This version is provided as part of Julius-3.5.1. -.SH COPYRIGHT -Copyright (c) 2001-2005 Kawahara Lab., Kyoto University -.br -Copyright (c) 2001-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/mkgshmm/mkgshmm.man.ja diff -u julius4/mkgshmm/mkgshmm.man.ja:1.1.1.1 julius4/mkgshmm/mkgshmm.man.ja:removed --- julius4/mkgshmm/mkgshmm.man.ja:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkgshmm/mkgshmm.man.ja Thu Oct 2 17:23:49 2008 @@ -1,60 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKGSHMM 1 LOCAL -.UC 6 -.SH NAME -mkgshmm - convert monophone HMM to GS HMM for Julius -.SH SYNOPSIS -.B mkgshmm monophone_hmmdefs > outputfile -.SH DESCRIPTION -.I mkgshmm -はHTK形式のmonophone HMMを -.I Julius -の Gaussian Mixture Selection (GMS) 用に変換するperlスクリプトです. -.PP -GMSはJulius-3.2からサポートされている音響尤度計算の高速化手法です. -フレームごとに monophone の状態尤度に基づいてtriphoneやPTMの状態を -予備選択することで,音響尤度計算がおよそ30%高速化されます. -.PP -.SH EXAMPLE -.PP -まずターゲットとするtriphoneやPTMに対して,同じコーパスで学習した monophone モデルを用意します. -.PP -次にそのmonophoneモデルを -.I mkgshmm -を用いて GMS 用に変換します(実際には状態定義をマクロ化しているだけです). -.PP - % mkgshmm monophone > gshmmfile -.PP -これを Julius で "-gshmm" で指定します. 
-.PP - % julius -C foo.jconf -gshmm gshmmfile -.PP -注意:GMS用モデルはtriphoneやPTMと同一のコーパスから作成する必要がある点に注意してください.gshmm がミスマッチだと選択誤りが生じ,性能が劣化します. -.SH "SEE ALSO" -julius(1) -.SH BUGS -.PP -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH VERSION -This version is provided as part of Julius-3.5.1. -.SH COPYRIGHT -Copyright (c) 2001-2005 京都大学 河原研究室 -.br -Copyright (c) 2001-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:49 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:49 +0900 Subject: [Julius-cvs 289] CVS update: julius4/mkss Message-ID: <1222935829.630301.32493.nullmailer@users.sourceforge.jp> Index: julius4/mkss/00readme-ja.txt diff -u julius4/mkss/00readme-ja.txt:1.2 julius4/mkss/00readme-ja.txt:1.3 --- julius4/mkss/00readme-ja.txt:1.2 Tue Dec 18 23:08:23 2007 +++ julius4/mkss/00readme-ja.txt Thu Oct 2 17:23:49 2008 @@ -1,58 +1,56 @@ + mkss + MKSS(1) MKSS(1) -NAME - mkss - compute average spectrum from mic input for SS +?? + mkss + - ????????????????????????? -SYNOPSIS - mkss [options..] filename +?? + mkss [options...] {filename} DESCRIPTION - mkss ????????????????????????????????? - ???????c??????????t???? Julius ??????? ? - ? ??????????????????????????? "-ssload"?? - ????????? - - ????????s????????????????? - - ????????16bit signed short (big endian), monoral ?????? - ????ョ?RAW(?????)?big endian?ョ?????????????? - ??????????????D - - ???????? "-" ??????????o?????????????D + mkss ????????????????????????????????? + ??????????????????????????? ???????? + ??????? ??????????D?????t?????Julius ?? + ???? ?????????????????????????????? + "-ssload"??????????? + + ???????????????????????16bit signed short (big + endian), monoral ??????????????????????????+ ?????D????????? "-" ?????? ????o??????+ ??? 
OPTIONS - -freq threshold - ??????????Hz??????(default: 16000) + -freq Hz + ???????????? (Hz) ??????(default: 16,000) - -len msec - ???????????????? (default: 3000)? + -len msec + ???????????????????default: 3000? - -fsize samplenum - ????????????????????? (default: 400)? + -fsize sample_num + ????????????? (default: 400)? - -fshift samplenum - ????????????????????? (default: 160)? + -fshift sample_num + ????????????????? (default: 160)? SEE ALSO - julius(1) - -BUGS - ? ? ? ?? ? ? ??????????? julius-info at lists.source- - forge.jp ????????? + julius ( 1 ) COPYRIGHT - Copyright (c) 2002-2006 ???? ????コ - Copyright (c) 2002-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2006 ??????? Julius????? + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL MKSS(1) + 10/02/2008 MKSS(1) Index: julius4/mkss/00readme.txt diff -u julius4/mkss/00readme.txt:1.2 julius4/mkss/00readme.txt:1.3 --- julius4/mkss/00readme.txt:1.2 Tue Dec 18 23:08:23 2007 +++ julius4/mkss/00readme.txt Thu Oct 2 17:23:49 2008 @@ -1,58 +1,55 @@ + mkss + MKSS(1) MKSS(1) NAME - mkss - compute average spectrum from mic input for SS + mkss + - calculate average spectrum for spectral subtraction SYNOPSIS - mkss [options..] filename + mkss [options...] {filename} DESCRIPTION - mkss is a tool for estimating noise spectrum for spectral subtraction - on Julius. It reads a few seconds of sound data from microphone input, - and saves the average spectrum to a file. The output file can be used - as a noise spectrum data in Julius (option "-ssload"). + mkss is a tool to estimate noise spectrum for spectral subtraction on + Julius. It reads a few seconds of sound data from microphone input, + calculate the average spectrum and save it to a file. 
The output file + can be used as a noise spectrum data in Julius (option "-ssload"). - Output format is RAW (no header), 16bit (signed short, big endian), - monoral. If the file already exist, it will be overridden. + The recording will start immediately after startup. Sampling format is + 16bit, monaural. If the output file already exists, it will be overridden. OPTIONS - -freq threshold - Sampling frequency (Hz, default=16000) + -freq Hz + Sampling frequency in Hz (default: 16,000) - -len msec - length to record in milliseconds (default: 3000). + -len msec + capture length in milliseconds (default: 3000) - -fsize samplenum - frame size in number of samples (default: 400). + -fsize sample_num + frame size in number of samples (default: 400) - -fshift samplenum - frame shift in number of samples (default: 160). - -USAGE - Start mkss and stay quiet for 3 seconds. Then the average noise spec- - trum will be recorded to the specified file. When you start Julius, - specify option "-ssload thatfile", and you can use microphone input - with spectral subtraction. + -fshift sample_num + frame shift in number of samples (default: 160) SEE ALSO - julius(1) + julius ( 1 ) COPYRIGHT - Copyright (c) 2002-2006 Kawahara Lab., Kyoto University - Copyright (c) 2002-2005 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius.
-4.3 Berkeley Distribution LOCAL MKSS(1) + 10/02/2008 MKSS(1) Index: julius4/mkss/mkss.man diff -u julius4/mkss/mkss.man:1.1.1.1 julius4/mkss/mkss.man:removed --- julius4/mkss/mkss.man:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkss/mkss.man Thu Oct 2 17:23:49 2008 @@ -1,56 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKSS 1 LOCAL -.UC 6 -.SH NAME -mkss - compute average spectrum from mic input for SS -.SH SYNOPSIS -.B mkss [options..] filename -.SH DESCRIPTION -.I mkss -is a tool for estimating noise spectrum for spectral subtraction on -Julius. It reads a few seconds of sound data from microphone -input, and saves the average spectrum to a file. The output file can -be used as a noise spectrum data in -.I Julius -(option "-ssload"). -.PP -Output format is RAW (no header), 16bit (signed short, big endian), -monoral. If the file already exist, it will be overridden. -.SH OPTIONS -.Ip "\-freq threshold" -Sampling frequency (Hz, default=16000) -.Ip "\-len msec" -length to record in milliseconds (default: 3000). -.Ip "\-fsize samplenum" -frame size in number of samples (default: 400). -.Ip "\-fshift samplenum" -frame shift in number of samples (default: 160). -.SH "USAGE" -Start mkss and stay quiet for 3 seconds. Then the average noise -spectrum will be recorded to the specified file. When you start -Julius, specify option "-ssload thatfile", and you can use microphone -input with spectral subtraction. -.SH "SEE ALSO" -julius(1) -.SH COPYRIGHT -Copyright (c) 2002-2006 Kawahara Lab., Kyoto University -.br -Copyright (c) 2002-2005 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2006 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. 
Index: julius4/mkss/mkss.man.ja diff -u julius4/mkss/mkss.man.ja:1.1.1.1 julius4/mkss/mkss.man.ja:removed --- julius4/mkss/mkss.man.ja:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/mkss/mkss.man.ja Thu Oct 2 17:23:49 2008 @@ -1,56 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH MKSS 1 LOCAL -.UC 6 -.SH NAME -mkss - compute average spectrum from mic input for SS -.SH SYNOPSIS -.B mkss [options..] filename -.SH DESCRIPTION -.I mkss -は指定時間分の音をマイク入力から録音し,その平均スペクトラムをファイルに -出力するツールです.出力されたファイルは -.I Julius -でスペクトルサブトラクションのためのノイズスペクトルファイル -(オプション "-ssload")として利用できます. -.PP -音声の切り出しは行わず,起動と同時に録音を始めます. -.PP -サンプリング条件は16bit signed short (big endian), monoral で固定です. -データ形式はRAW(ヘッダ無し),big endian形式です. -既に同じ名前のファイルが存在する場合は上書きします. -.PP -なおファイル名に "-" を指定することで標準出力へ出力することもできます. -.SH OPTIONS -.Ip "\-freq threshold" -サンプリング周波数をHzで指定する.(default: 16000) -.Ip "\-len msec" -録音時間長をミリ秒単位で指定する (default: 3000). -.Ip "\-fsize samplenum" -分析のフレームサイズをサンプル数で指定する (default: 400). -.Ip "\-fshift samplenum" -分析のフレームシフトをサンプル数で指定する (default: 160). -.SH "SEE ALSO" -julius(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH COPYRIGHT -Copyright (c) 2002-2006 京都大学 河原研究室 -.br -Copyright (c) 2002-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2006 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. 
From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:49 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:49 +0900 Subject: [Julius-cvs 290] CVS update: julius4/support Message-ID: <1222935829.787593.32502.nullmailer@users.sourceforge.jp> Index: julius4/support/makeman.sh diff -u julius4/support/makeman.sh:1.1.1.1 julius4/support/makeman.sh:1.2 --- julius4/support/makeman.sh:1.1.1.1 Fri Sep 28 11:50:56 2007 +++ julius4/support/makeman.sh Thu Oct 2 17:23:49 2008 @@ -1,9 +1,10 @@ #!/bin/sh # -# usage: makeman.sh julius.man +# Update 00readme.txt and 00readme-ja.txt from man file. +# +# usage: makeman.sh generate gramtools/generate # -# generate julius.man.txt, julius.man.txt.ja # -nroff -man $1 | sed -e 's/.//g' | nkf -c > $1.txt -LANG=ja_JP.eucJP nroff -Tnippon -man $1.ja | sed -e 's/.//g' | nkf -s -c > $1.txt.ja -#man -Tps -l $1 > $1.txt.ps +nroff -man man/$1.1 | sed -e 's/.//g' | nkf -c > $2/00readme.txt +LANG=ja_JP.eucJP nroff -Tnippon -man man/ja/$1.1 | sed -e 's/.//g' | nkf -s -c > $2/00readme-ja.txt +echo $1 "->" $2 Index: julius4/support/update-mantxt.sh diff -u julius4/support/update-mantxt.sh:1.2 julius4/support/update-mantxt.sh:1.3 --- julius4/support/update-mantxt.sh:1.2 Tue Dec 18 23:08:23 2007 +++ julius4/support/update-mantxt.sh Thu Oct 2 17:23:49 2008 @@ -4,36 +4,29 @@ # # should be invoked at parent directory. # +# The new manuals should be located at man and man/ja. +# # If conversion fails, see makeman.sh in this directory. 
# -tools_man="\ -./adinrec/adinrec.man \ -./adintool/adintool.man \ -./jcontrol/jcontrol.man \ -./mkbingram/mkbingram.man \ -./mkbinhmm/mkbinhmm.man \ -./mkgshmm/mkgshmm.man \ -./mkss/mkss.man \ -" - -############################## - -for m in $tools_man; do - echo $m - ./support/makeman.sh $m - mv $m.txt `dirname $m`/00readme.txt - mv $m.txt.ja `dirname $m`/00readme-ja.txt -done - -echo julius/julius.man -./support/makeman.sh julius/julius.man -mv julius/julius.man.txt julius/00readme.txt -mv julius/julius.man.txt.ja julius/00readme-ja.txt +echo 'Did you placed all the new manuals in "man" and "man/ja/" ?' -echo libjulius/jconf.man -./support/makeman.sh libjulius/jconf.man -mv libjulius/jconf.man.txt libjulius/00readme-jconf.txt -mv libjulius/jconf.man.txt.ja libjulius/00readme-jconf-ja.txt +./support/makeman.sh accept_check gramtools/accept_check +./support/makeman.sh adinrec adinrec +./support/makeman.sh adintool adintool +./support/makeman.sh dfa_determinize gramtools/dfa_determinize +./support/makeman.sh dfa_minimize gramtools/dfa_minimize +./support/makeman.sh generate-ngram generate-ngram +./support/makeman.sh generate gramtools/generate +./support/makeman.sh gram2sapixml.pl gramtools/gram2sapixml +./support/makeman.sh jclient.pl jclient-perl +./support/makeman.sh jcontrol jcontrol +./support/makeman.sh julius julius +./support/makeman.sh mkbingram mkbingram +./support/makeman.sh mkbinhmm mkbinhmm +./support/makeman.sh mkdfa.pl gramtools/mkdfa +./support/makeman.sh mkgshmm mkgshmm +./support/makeman.sh mkss mkss +./support/makeman.sh nextword gramtools/nextword echo Finished. 
From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:01 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:01 +0900 Subject: [Julius-cvs 291] CVS update: julius4 Message-ID: <1222937821.585548.29487.nullmailer@users.sourceforge.jp> Index: julius4/Makefile.in diff -u julius4/Makefile.in:1.2 julius4/Makefile.in:1.3 --- julius4/Makefile.in:1.2 Tue Dec 18 17:45:45 2007 +++ julius4/Makefile.in Thu Oct 2 17:57:01 2008 @@ -5,11 +5,11 @@ # # Makefile.in --- Makefile Template for configure # -# $Id: Makefile.in,v 1.2 2007/12/18 08:45:45 sumomo Exp $ +# $Id: Makefile.in,v 1.3 2008/10/02 08:57:01 sumomo Exp $ # SHELL=/bin/sh -SUBDIRS=libsent libjulius julius mkbingram mkbinhmm adinrec adintool mkgshmm mkss jcontrol gramtools generate-ngram +SUBDIRS=libsent libjulius julius mkbingram mkbinhmm adinrec adintool mkgshmm mkss jcontrol gramtools generate-ngram jclient-perl man CONFIG_SUBDIRS=mkgshmm gramtools jcontrol julius libjulius libsent @@ -34,14 +34,7 @@ done install.man: - for d in $(SUBDIRS); do \ - (cd $$d; $(MAKE) install.man); \ - done - -install.man.ja: - for d in $(SUBDIRS); do \ - (cd $$d; $(MAKE) install.man.ja); \ - done + (cd man; $(MAKE) install) clean: for d in $(SUBDIRS); do \ Index: julius4/configure diff -u julius4/configure:1.2 julius4/configure:1.3 --- julius4/configure:1.2 Tue Dec 18 17:45:45 2007 +++ julius4/configure Thu Oct 2 17:57:01 2008 @@ -1101,7 +1101,7 @@ ac_given_srcdir=$srcdir ac_given_INSTALL="$INSTALL" -trap 'rm -fr `echo "Makefile mkbingram/Makefile mkbinhmm/Makefile adinrec/Makefile adintool/Makefile mkss/Makefile generate-ngram/Makefile" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 +trap 'rm -fr `echo "Makefile mkbingram/Makefile mkbinhmm/Makefile adinrec/Makefile adintool/Makefile mkss/Makefile generate-ngram/Makefile jclient-perl/Makefile man/Makefile" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 EOF cat >> $CONFIG_STATUS <> $CONFIG_STATUS <> $CONFIG_STATUS <<\EOF for ac_file in .. 
$CONFIG_FILES; do if test "x$ac_file" != x..; then Index: julius4/configure.in diff -u julius4/configure.in:1.2 julius4/configure.in:1.3 --- julius4/configure.in:1.2 Tue Dec 18 17:45:45 2007 +++ julius4/configure.in Thu Oct 2 17:57:01 2008 @@ -3,7 +3,7 @@ dnl Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology dnl All rights reserved dnl -dnl $Id: configure.in,v 1.2 2007/12/18 08:45:45 sumomo Exp $ +dnl $Id: configure.in,v 1.3 2008/10/02 08:57:01 sumomo Exp $ dnl AC_INIT(Sample.jconf) AC_CONFIG_AUX_DIR(support) @@ -31,4 +31,4 @@ AC_PROG_INSTALL AC_PATH_PROG(RM, rm) -AC_OUTPUT(Makefile mkbingram/Makefile mkbinhmm/Makefile adinrec/Makefile adintool/Makefile mkss/Makefile generate-ngram/Makefile) +AC_OUTPUT(Makefile mkbingram/Makefile mkbinhmm/Makefile adinrec/Makefile adintool/Makefile mkss/Makefile generate-ngram/Makefile jclient-perl/Makefile man/Makefile) From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:01 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:01 +0900 Subject: [Julius-cvs 292] CVS update: julius4/adinrec Message-ID: <1222937821.754909.29501.nullmailer@users.sourceforge.jp> Index: julius4/adinrec/Makefile.in diff -u julius4/adinrec/Makefile.in:1.3 julius4/adinrec/Makefile.in:1.4 --- julius4/adinrec/Makefile.in:1.3 Thu Sep 25 13:49:04 2008 +++ julius4/adinrec/Makefile.in Thu Oct 2 17:57:01 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.3 2008/09/25 04:49:04 sumomo Exp $ +# $Id: Makefile.in,v 1.4 2008/10/02 08:57:01 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -33,20 +33,12 @@ ############################################################ -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ adinrec.man @mandir@/man1/adinrec.1 - 
-install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ adinrec.man.ja @mandir@/man1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:01 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:01 +0900 Subject: [Julius-cvs 293] CVS update: julius4/adintool Message-ID: <1222937821.930505.29512.nullmailer@users.sourceforge.jp> Index: julius4/adintool/Makefile.in diff -u julius4/adintool/Makefile.in:1.3 julius4/adintool/Makefile.in:1.4 --- julius4/adintool/Makefile.in:1.3 Thu Sep 25 13:49:04 2008 +++ julius4/adintool/Makefile.in Thu Oct 2 17:57:01 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.3 2008/09/25 04:49:04 sumomo Exp $ +# $Id: Makefile.in,v 1.4 2008/10/02 08:57:01 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -33,20 +33,12 @@ ############################################################ -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ adintool.man @mandir@/man1/adintool.1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ adintool.man.ja @mandir@/man1/adintool.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 294] CVS update: julius4/generate-ngram Message-ID: <1222937822.067622.29519.nullmailer@users.sourceforge.jp> Index: julius4/generate-ngram/Makefile.in diff -u julius4/generate-ngram/Makefile.in:1.6 julius4/generate-ngram/Makefile.in:1.7 --- julius4/generate-ngram/Makefile.in:1.6 Thu Sep 25 13:49:04 2008 +++ julius4/generate-ngram/Makefile.in Thu Oct 2 
17:57:01 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.6 2008/09/25 04:49:04 sumomo Exp $ +# $Id: Makefile.in,v 1.7 2008/10/02 08:57:01 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -29,20 +29,12 @@ $(TARGET): $(OBJ) $(LIBSENT)/libsent.a $(CC) $(CFLAGS) $(CPPFLAGS) -o $@ $(OBJ) $(LDFLAGS) -install: install.bin #install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man @mandir@/man1/$(TARGET).1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man.ja @mandir@/man1/$(TARGET).1 - clean: $(RM) $(OBJ) *~ core $(RM) $(TARGET) $(TARGET).exe From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 295] CVS update: julius4/gramtools Message-ID: <1222937822.246412.29526.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/Makefile.in diff -u julius4/gramtools/Makefile.in:1.2 julius4/gramtools/Makefile.in:1.3 --- julius4/gramtools/Makefile.in:1.2 Tue Dec 18 17:45:46 2007 +++ julius4/gramtools/Makefile.in Thu Oct 2 17:57:02 2008 @@ -4,7 +4,7 @@ # All rights reserved # -# $Id: Makefile.in,v 1.2 2007/12/18 08:45:46 sumomo Exp $ +# $Id: Makefile.in,v 1.3 2008/10/02 08:57:02 sumomo Exp $ # SHELL=/bin/sh RM=@RM@ -f @@ -29,14 +29,6 @@ (cd $$d; $(MAKE) install.bin); \ done -install.man: - for d in $(SUBDIRS); do \ - (cd $$d; $(MAKE) install.man); \ - done - -install.man.ja: - echo nothing to be installed for gramtools. 
- clean: for d in $(SUBDIRS); do \ (cd $$d; $(MAKE) clean); \ From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 296] CVS update: julius4/gramtools/accept_check Message-ID: <1222937822.390055.29533.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/accept_check/Makefile.in diff -u julius4/gramtools/accept_check/Makefile.in:1.3 julius4/gramtools/accept_check/Makefile.in:1.4 --- julius4/gramtools/accept_check/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ julius4/gramtools/accept_check/Makefile.in Thu Oct 2 17:57:02 2008 @@ -32,20 +32,12 @@ ############################################################ -install: install.bin # install.man install.catman +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -#install.man: -# ${INSTALL} -d @mandir@/man1 -# @INSTALL_DATA@ $(TARGET).jman @mandir@/man1/adinrec.1 - -#install.catman: -# ${INSTALL} -d @mandir@/cat1 -# @INSTALL_DATA@ $(TARGET).jman.txt @mandir@/cat1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 297] CVS update: julius4/gramtools/dfa_determinize Message-ID: <1222937822.531024.29541.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/dfa_determinize/Makefile.in diff -u julius4/gramtools/dfa_determinize/Makefile.in:1.3 julius4/gramtools/dfa_determinize/Makefile.in:1.4 --- julius4/gramtools/dfa_determinize/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ julius4/gramtools/dfa_determinize/Makefile.in Thu Oct 2 17:57:02 2008 @@ -31,20 +31,12 @@ ############################################################ -install: install.bin # install.man install.catman +install: install.bin install.bin: $(TARGET) ${INSTALL} -d 
@bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -#install.man: -# ${INSTALL} -d @mandir@/man1 -# @INSTALL_DATA@ $(TARGET).jman @mandir@/man1/adinrec.1 - -#install.catman: -# ${INSTALL} -d @mandir@/cat1 -# @INSTALL_DATA@ $(TARGET).jman.txt @mandir@/cat1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 298] CVS update: julius4/gramtools/dfa_minimize Message-ID: <1222937822.681722.29548.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/dfa_minimize/Makefile.in diff -u julius4/gramtools/dfa_minimize/Makefile.in:1.3 julius4/gramtools/dfa_minimize/Makefile.in:1.4 --- julius4/gramtools/dfa_minimize/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ julius4/gramtools/dfa_minimize/Makefile.in Thu Oct 2 17:57:02 2008 @@ -31,20 +31,12 @@ ############################################################ -install: install.bin # install.man install.catman +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -#install.man: -# ${INSTALL} -d @mandir@/man1 -# @INSTALL_DATA@ $(TARGET).jman @mandir@/man1/adinrec.1 - -#install.catman: -# ${INSTALL} -d @mandir@/cat1 -# @INSTALL_DATA@ $(TARGET).jman.txt @mandir@/cat1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:02 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:02 +0900 Subject: [Julius-cvs 299] CVS update: julius4/gramtools/generate Message-ID: <1222937822.872500.29555.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/generate/Makefile.in diff -u julius4/gramtools/generate/Makefile.in:1.3 julius4/gramtools/generate/Makefile.in:1.4 --- julius4/gramtools/generate/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ 
julius4/gramtools/generate/Makefile.in Thu Oct 2 17:57:02 2008 @@ -31,20 +31,12 @@ ############################################################ -install: install.bin # install.man install.catman +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -#install.man: -# ${INSTALL} -d @mandir@/man1 -# @INSTALL_DATA@ $(TARGET).jman @mandir@/man1/adinrec.1 - -#install.catman: -# ${INSTALL} -d @mandir@/cat1 -# @INSTALL_DATA@ $(TARGET).jman.txt @mandir@/cat1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 300] CVS update: julius4/gramtools/nextword Message-ID: <1222937823.009482.29562.nullmailer@users.sourceforge.jp> Index: julius4/gramtools/nextword/Makefile.in diff -u julius4/gramtools/nextword/Makefile.in:1.3 julius4/gramtools/nextword/Makefile.in:1.4 --- julius4/gramtools/nextword/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ julius4/gramtools/nextword/Makefile.in Thu Oct 2 17:57:02 2008 @@ -32,20 +32,12 @@ ############################################################ -install: install.bin # install.man install.catman +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -#install.man: -# ${INSTALL} -d @mandir@/man1 -# @INSTALL_DATA@ $(TARGET).jman @mandir@/man1/adinrec.1 - -#install.catman: -# ${INSTALL} -d @mandir@/cat1 -# @INSTALL_DATA@ $(TARGET).jman.txt @mandir@/cat1/adinrec.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 301] CVS update: julius4/jclient-perl Message-ID: <1222937823.146465.29570.nullmailer@users.sourceforge.jp> Index: 
julius4/jclient-perl/Makefile.in diff -u /dev/null julius4/jclient-perl/Makefile.in:1.1 --- /dev/null Thu Oct 2 17:57:03 2008 +++ julius4/jclient-perl/Makefile.in Thu Oct 2 17:57:03 2008 @@ -0,0 +1,27 @@ +# Copyright (c) 1991-2007 Kawahara Lab., Kyoto University +# Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology +# Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology +# All rights reserved + +SHELL=/bin/sh +RM=@RM@ -f +prefix=@prefix@ +exec_prefix=@exec_prefix@ +INSTALL=@INSTALL@ + +TARGET=jclient.pl + +all: + chmod +x $(TARGET) + +install: install.bin + +install.bin: + ${INSTALL} -d @bindir@ + @INSTALL_PROGRAM@ $(TARGET) @bindir@ + +clean: + echo nothing to do + +distclean: + $(RM) Makefile From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 302] CVS update: julius4/jcontrol Message-ID: <1222937823.302169.29578.nullmailer@users.sourceforge.jp> Index: julius4/jcontrol/Makefile.in diff -u julius4/jcontrol/Makefile.in:1.2 julius4/jcontrol/Makefile.in:1.3 --- julius4/jcontrol/Makefile.in:1.2 Tue Dec 18 17:45:48 2007 +++ julius4/jcontrol/Makefile.in Thu Oct 2 17:57:03 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.2 2007/12/18 08:45:48 sumomo Exp $ +# $Id: Makefile.in,v 1.3 2008/10/02 08:57:03 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -28,20 +28,12 @@ $(TARGET): $(OBJ) $(CC) $(CFLAGS) $(CPPFLAGS) -o $@ $(OBJ) $(LDFLAGS) -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man @mandir@/man1/$(TARGET).1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man.ja @mandir@/man1/$(TARGET).1 - clean: $(RM) $(OBJ) 
$(RM) config.log config.cache From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 303] CVS update: julius4/julius Message-ID: <1222937823.477216.29589.nullmailer@users.sourceforge.jp> Index: julius4/julius/Makefile.in diff -u julius4/julius/Makefile.in:1.4 julius4/julius/Makefile.in:1.5 --- julius4/julius/Makefile.in:1.4 Thu Sep 25 13:49:05 2008 +++ julius4/julius/Makefile.in Thu Oct 2 17:57:03 2008 @@ -5,7 +5,7 @@ # All rights reserved # -# $Id: Makefile.in,v 1.4 2008/09/25 04:49:05 sumomo Exp $ +# $Id: Makefile.in,v 1.5 2008/10/02 08:57:03 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -58,20 +58,12 @@ ############################################################ -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ ${INSTALL_PROGRAM} $(TARGET) ${bindir}/${INSTALLTARGET} -install.man: - ${INSTALL} -d @mandir@/man1 - ${INSTALL_DATA} $(TARGET).man ${mandir}/man1/$(TARGET).1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - ${INSTALL_DATA} $(TARGET).man.ja ${mandir}/man1/$(TARGET).1 - depend: makedepend -- $(CFLAGS) -- $(OBJSENT) Index: julius4/julius/configure diff -u julius4/julius/configure:1.1.1.1 julius4/julius/configure:1.2 --- julius4/julius/configure:1.1.1.1 Fri Sep 28 11:50:55 2007 +++ julius4/julius/configure Thu Oct 2 17:57:03 2008 @@ -465,7 +465,7 @@ # A filename unique to this package, relative to the directory that # configure is in, which we can look for to find out if srcdir is correct. -ac_unique_file=julius.man +ac_unique_file=main.c # Find the source files, if location was not specified. 
if test -z "$srcdir"; then Index: julius4/julius/configure.in diff -u julius4/julius/configure.in:1.2 julius4/julius/configure.in:1.3 --- julius4/julius/configure.in:1.2 Tue Dec 18 17:45:48 2007 +++ julius4/julius/configure.in Thu Oct 2 17:57:03 2008 @@ -4,10 +4,10 @@ dnl Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology dnl All rights reserved dnl -dnl $Id: configure.in,v 1.2 2007/12/18 08:45:48 sumomo Exp $ +dnl $Id: configure.in,v 1.3 2008/10/02 08:57:03 sumomo Exp $ dnl -AC_INIT(julius.man) +AC_INIT(main.c) AC_CONFIG_HEADER(config.h) AC_CONFIG_AUX_DIR(../support) From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 304] CVS update: julius4/libjulius Message-ID: <1222937823.636094.29596.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/Makefile.in diff -u julius4/libjulius/Makefile.in:1.4 julius4/libjulius/Makefile.in:1.5 --- julius4/libjulius/Makefile.in:1.4 Thu Sep 25 14:00:04 2008 +++ julius4/libjulius/Makefile.in Thu Oct 2 17:57:03 2008 @@ -5,7 +5,7 @@ # All rights reserved # -# $Id: Makefile.in,v 1.4 2008/09/25 05:00:04 sumomo Exp $ +# $Id: Makefile.in,v 1.5 2008/10/02 08:57:03 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -101,12 +101,6 @@ ${INSTALL} -d ${bindir} ${INSTALL_PROGRAM} libjulius-config ${bindir} -install.man: - echo nothing to be installed for libjulius. - -install.man.ja: - echo nothing to be installed for libjulius. 
- depend: makedepend -- $(CFLAGS) -- $(OBJSENT) From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 305] CVS update: julius4/libsent Message-ID: <1222937823.775460.29604.nullmailer@users.sourceforge.jp> Index: julius4/libsent/Makefile.in diff -u julius4/libsent/Makefile.in:1.6 julius4/libsent/Makefile.in:1.7 --- julius4/libsent/Makefile.in:1.6 Tue Sep 30 12:58:17 2008 +++ julius4/libsent/Makefile.in Thu Oct 2 17:57:03 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.6 2008/09/30 03:58:17 sumomo Exp $ +# $Id: Makefile.in,v 1.7 2008/10/02 08:57:03 sumomo Exp $ # SHELL=/bin/sh @@ -155,9 +155,6 @@ ${INSTALL} -d ${bindir} ${INSTALL_PROGRAM} libsent-config ${bindir} -install.man.ja: - echo nothing to be installed for libsent. - clean: $(RM) *~ src/*/*~ src/*/*.o src/*/*/*.o include/sent/*~ $(RM) config.log config.cache From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:03 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:03 +0900 Subject: [Julius-cvs 306] CVS update: julius4/man Message-ID: <1222937823.920586.29612.nullmailer@users.sourceforge.jp> Index: julius4/man/Makefile.in diff -u /dev/null julius4/man/Makefile.in:1.1 --- /dev/null Thu Oct 2 17:57:03 2008 +++ julius4/man/Makefile.in Thu Oct 2 17:57:03 2008 @@ -0,0 +1,36 @@ +# Copyright (c) 1991-2007 Kawahara Lab., Kyoto University +# Copyright (c) 2001-2005 Shikano Lab., Nara Institute of Science and Technology +# Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology +# All rights reserved +# +# $Id: Makefile.in,v 1.1 2008/10/02 08:57:03 sumomo Exp $ +# +SHELL=/bin/sh +RM=@RM@ -f +prefix=@prefix@ +exec_prefix=@exec_prefix@ +INSTALL=@INSTALL@ + +############################################################ + 
+install.man: + ${INSTALL} -d @mandir@/man1 + for f in *.1; do \ + @INSTALL_DATA@ $$f @mandir@/man1/$$f; \ + done + +install.man.ja: + ${INSTALL} -d @mandir@/man1/ja + cd ja; + for f in *.1; do \ + @INSTALL_DATA@ $$f @mandir@/man1/ja/$$f; \ + done + cd .. + +############################################################ + +clean: + echo nothing to do + +distclean: + $(RM) Makefile From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:04 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:04 +0900 Subject: [Julius-cvs 307] CVS update: julius4/mkbingram Message-ID: <1222937824.059592.29619.nullmailer@users.sourceforge.jp> Index: julius4/mkbingram/Makefile.in diff -u julius4/mkbingram/Makefile.in:1.3 julius4/mkbingram/Makefile.in:1.4 --- julius4/mkbingram/Makefile.in:1.3 Thu Sep 25 13:49:05 2008 +++ julius4/mkbingram/Makefile.in Thu Oct 2 17:57:03 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.3 2008/09/25 04:49:05 sumomo Exp $ +# $Id: Makefile.in,v 1.4 2008/10/02 08:57:03 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -29,20 +29,12 @@ $(TARGET): $(OBJ) $(LIBSENT)/libsent.a $(CC) $(CFLAGS) $(CPPFLAGS) -o $@ $(OBJ) $(LDFLAGS) -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man @mandir@/man1/$(TARGET).1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man.ja @mandir@/man1/$(TARGET).1 - clean: $(RM) $(OBJ) $(RM) *~ core From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:04 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:04 +0900 Subject: [Julius-cvs 308] CVS update: julius4/mkbinhmm Message-ID: <1222937824.226030.29626.nullmailer@users.sourceforge.jp> Index: julius4/mkbinhmm/Makefile.in diff -u 
julius4/mkbinhmm/Makefile.in:1.4 julius4/mkbinhmm/Makefile.in:1.5 --- julius4/mkbinhmm/Makefile.in:1.4 Tue Sep 30 12:58:18 2008 +++ julius4/mkbinhmm/Makefile.in Thu Oct 2 17:57:04 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.4 2008/09/30 03:58:18 sumomo Exp $ +# $Id: Makefile.in,v 1.5 2008/10/02 08:57:04 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -29,22 +29,12 @@ mkbinhmmlist: mkbinhmmlist.o $(LIBSENT)/libsent.a $(CC) $(CFLAGS) $(CPPFLAGS) -o $@ mkbinhmmlist.o $(LDFLAGS) -install: install.bin install.man +install: install.bin install.bin: mkbinhmm mkbinhmmlist ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ mkbinhmm mkbinhmmlist @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ mkbinhmm.man @mandir@/man1/mkbinhmm.1 - @INSTALL_DATA@ mkbinhmmlist.man @mandir@/man1/mkbinhmmlist.1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ mkbinhmm.man.ja @mandir@/man1/mkbinhmm.1 - @INSTALL_DATA@ mkbinhmmlist.man.ja @mandir@/man1/mkbinhmmlist.1 - clean: $(RM) mkbinhmm.o mkbinhmmlist.o $(RM) *~ core From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:04 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:04 +0900 Subject: [Julius-cvs 309] CVS update: julius4/mkgshmm Message-ID: <1222937824.386685.29633.nullmailer@users.sourceforge.jp> Index: julius4/mkgshmm/Makefile.in diff -u julius4/mkgshmm/Makefile.in:1.2 julius4/mkgshmm/Makefile.in:1.3 --- julius4/mkgshmm/Makefile.in:1.2 Tue Dec 18 17:45:55 2007 +++ julius4/mkgshmm/Makefile.in Thu Oct 2 17:57:04 2008 @@ -20,20 +20,12 @@ ############################################################ -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ $(TARGET).man @mandir@/man1/$(TARGET).1 - -install.man.ja: - ${INSTALL} -d 
@mandir@/man1 - @INSTALL_DATA@ $(TARGET).man.ja @mandir@/man1/$(TARGET).1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:57:04 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:57:04 +0900 Subject: [Julius-cvs 310] CVS update: julius4/mkss Message-ID: <1222937824.539125.29640.nullmailer@users.sourceforge.jp> Index: julius4/mkss/Makefile.in diff -u julius4/mkss/Makefile.in:1.3 julius4/mkss/Makefile.in:1.4 --- julius4/mkss/Makefile.in:1.3 Thu Sep 25 13:49:06 2008 +++ julius4/mkss/Makefile.in Thu Oct 2 17:57:04 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.3 2008/09/25 04:49:06 sumomo Exp $ +# $Id: Makefile.in,v 1.4 2008/10/02 08:57:04 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -33,20 +33,12 @@ ############################################################ -install: install.bin install.man +install: install.bin install.bin: $(TARGET) ${INSTALL} -d @bindir@ @INSTALL_PROGRAM@ $(TARGET) @bindir@ -install.man: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ mkss.man @mandir@/man1/mkss.1 - -install.man.ja: - ${INSTALL} -d @mandir@/man1 - @INSTALL_DATA@ mkss.man.ja @mandir@/man1/mkss.1 - ############################################################ clean: From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:45 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:45 +0900 Subject: [Julius-cvs 311] CVS update: julius4/adintool Message-ID: <1222935825.596016.32218.nullmailer@users.sourceforge.jp> Index: julius4/adintool/00readme-ja.txt diff -u julius4/adintool/00readme-ja.txt:1.2 julius4/adintool/00readme-ja.txt:1.3 --- julius4/adintool/00readme-ja.txt:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adintool/00readme-ja.txt Thu Oct 2 17:23:45 2008 @@ -1,206 +1,214 @@ + adintool + ADINTOOL(1) ADINTOOL(1) -NAME - adintool - 
audio tool to record/split/send/receive speech data for - Julius +?? + adintool + - ?????????????????????? -SYNOPSIS - adintool -in inputdev -out outputdev [options...] +?? + adintool {-in inputdev} {-out outputdev} [options...] DESCRIPTION - adintool ?????????????????????L?????? ? ? - ?? ?????????????????????????????????+ adintool ?????????????????????L??????? ? + ????????????????????????????????? ?? ???????????????????D adintool ? adinrec ???????????????????????? ? - ?? ? ????????????E????????(adinnet ?????? - ?)?????????????????C???????????o???? - ? ?????adinnet ?????????)??????????????? - ???iadinnet ????????????? julius ????????? ? - ??????????ッ??????????? - - ? ???????????ゥ??????????????D??????? - ????adinrec ??????????????????????????? - ? ???????????????????????J??????????- ????????I?????C???????????????????? - ???? - - ?????????????????????ョ? 16bit monoral ?????- ????f???ョ? WAV, 16bit, ??????????????????? - ?????????????D - -INPUT - ????????????????????????????? - - -in mic - ????????????? - - -in file - ??????????ョ? RAW (16bit big endian)?WAV(????? - ??????????????? - ?????????????????????????????? - - -in adinnet - adinnet ????????????????? adinnet ????? ? - ? ???????????? adinnet ?????????TCP/IP?? - ????????????? adinnet ????????????? ? - ????? - ?? ? ????????? 5530 ???????????? "-port" - ?????? - - -in netaudio - (?????????????????Netaudio/DatLink????? ? - ? ??????????????????? "-NA host:unit" ??? - ???????? - - -in stdin - ????D??????ョ? RAW, WAV ??? - -OUTPUT - ???????????f?????o???f???????????? ? - ????????? - - -out file - ?? ? ? ? ????D??t????????????"-filename - foobar" ???????タ??? "foobar.0000" , "foobar.0001" ... - ? ???????????????????4??ID???????? - ?????? ID ? 0 ???l?????????????P?? ? - ?? ????????? "-startid" ??????????????- ?????ョ? 16bit WAV ?ョ???? RAW ?ョ???? ? ? ? - "-raw" ??????????? - - -out adinnet - adinnet ???????????????????? adinnet ??? - ??????????????????? adintool ? adinnet ? ? - ? ? ? ? ????adinnet ?????????????????? 
- ??adinnet ????????? adintool ??? Julius ?adinnet - ????????? - "-server" ?????adinnet?????????????????? - ?????????? 5530 ???????????? "-port" ? ? - ???? - - -out stdout - ? ????o?????ョ? RAW, 16bit signed (big endian) ?? - ?? - + ?? ?????????????E????????(adinnet ???? ?? + ?)????????Julius ? -input ?????? ??????????? + ?????????? + + ??????C???????????o??????????adinnet ? + ????????)??????????????????iadinnet ??? + ?????????? julius ????????????????????ッ + ??????????? + + ????????????ゥ??????????????D?????? ? + ????adinrec ????????????????????????? ? + ?????????????????????????J????????? + ?????????I?????C??????????????????? + ????? + + ???????????????????????ョ? 16bit, 1 channel + ????o????????ョ? Microsoft WAV ?ョ??? ??????? + ???????????????????D OPTIONS - -server host[,host...] - "-out adinnet" ??????????????????????? ? - ?????????????? - - -port num[,host...] - "-out adinnet" ???????????????????????? - ??????? "-server"???????????????? ? ?? - (default: 5530) - - -nosegment - ????????????????s???????????_??? - ?????????????C?????????4??ID???? ? - ????? - - -oneshot - ???????????P???????????????D - - -freq threshold - ????????????? Hz (default: 16000) - - -48 48kHz????????16kHz????????????? - - -lv threslevel - ????????????? (0 - 32767)?(default: 2000)? - - -zc zerocrossnum - ??????????????? (default: 60) - - -headmargin msec - ?????????????????????? (default: 400) - - -tailmargin msec - ???????????}?????????? (default: 400) - - -nostrip - ? ?? 0 ?????ゥ????s???????????????ゥ - ????s?? - - -zmean DC?????s?? + Julius ????????????????????????????? ?? + ???????????????????????adintool ? ?????? + ?????? Julius ??????????? + + adintool specific options + -freq Hz + ???????????? (Hz) ??????(default: 16,000) + + -in inputdev + ???????????????????"mic" ??????? "file" ? + ??????, "stdin" ??????????????D ??????? + ??C??????????????v?????? ???????? + ??"adinnet" ? adintool ? adinnet ???? ????adinnet ??? + ??????????? tcp/ip ??? ??????????? 5530 ? + ???"-inport" ??????? 
+ + ???????????? Julius ? "-input" ??????????? + ????????C????????????????? + + -out outputdev + ???????f?????????"file" ???????C stdout ? + ??o??????D???????C??t????? ????? + "-filename" ???????t??? ?ョ? 16bit WAV ?ョ???? ? + ??"adinnet" ? adintool ? adinnet ?????? ????adinnet + ??????????????? tcp/ip ??? ??????????? + ?? "-server" ?????? ?????? 5530 ????"-port" ??? + ???? + + -inport num + ??? adinnet ???(-in adinnet)???????????? ???? + ??????????f????? 5530 ???? + + -server [host] [,host...] + ???adinnet ???(-out adinnet)??????????????? + ???????C????????????? + + -port [num] [,num...] + ???adinnet ???(-out adinnet)??????????????? + ??????????????f????? 5530 ???? -server ?? + ??????????????C ???????ヲ?????????? + ???????? + + -filename file + ??????(-out file) ????t????? ?????????? + ????????????o???? "file.0000.wav" , "file.0001.wav" + ... ???????????? ???????????l? 0 ??? + ?-startid? ?????????????? -oneshot ???? ????+ ???? "file" ?????????? + + -startid number + ???????C??????????????l??????? ??? + ???0? + + -oneshot + ????????I????????D + + -nosegment + ???????????i???????????????????? ? + ???? + + -raw + RAW?????ョ?????D + + -autopause + ???adinnet ???i-out adinnet???????????????? + ???????????s???????adinnet ???? ?????? + ??????????????? + + -loosesync + ???adinnet ?-out adinnet????????T??????????+ ?????????????J???????????????adintool + ? ?????????????????????????????? ?? + ?????????????????P??????????? ???? + ????????????? + + -rewind msec + ????????????????????J?????????? ?? + ????????????C????????????????? ??? + ????? + + Concerning Julius options + -input {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} + ?????????????"-in" ?????????????? ??? + ??????????????????esd ????????? ???? + ???? + + -lv thres + ????????????? 0 ?? 32767 ????????? (default: + 2000) + + -zc thres + ??????????????????????????? (default: 60) + + -headmargin msec + ???????????????????? (default: 300) + + -tailmargin msec + ????????}??????????? 
(default: 400) + + -zmean + ????????????????????s???????????? + ?????????D + + -smpFreq Hz + ???????????? (Hz) ??????(default: 16,000) + + -48 + 48kHz???????16kHz????????????? ??? 16kHz ?? + ??????????????????? ?????????????? + ? sptk ?? ?????? (Rev. 4.0) + + -NA devicename + DatLink ????????? (-input netaudio). + + -adport port_number + + -input adinnet ???????????? adinnet ?????????? + ??(default: 5530) + + -nostrip + ??????????????????????????????? ? + "0" ??????????????????Julius ???C?? ???? + ?????????????????D??????????????? + ????C???????????????ゥ???????????? + ???? + + -C jconffile + jconf?????????????????????????W????? + + -plugindir dirlist + ????????????????????????????????? + ??????????? + +ENVIRONMENT VARIABLES + ALSADEV + (?????? alsa ???????) ????????????? ??? + ?????"default"? + + AUDIODEV + (?????? oss ???????) ????????????? ??? + ?????"/dev/dsp"? + + LATENCY_MSEC + Linux (alsa/oss) ??? Windows ??????????????? ?? + ????????????????????????????????CPU + ????????????????????????OS? ??????? + ?????????????OS ????????? ?????????? + ???????????? - -raw ??????`ョ? RAW, 16bit signed (big endian) ??????? - ??? WAV ?ョ???? - - -autopause - ?????????I? pause ?????D - - -loosesync - ? ???????????????? pause ? resume ?????? - ?????????????????? - - -rewind msec - ??Cadintool ? pause ???????????????pause? ? - ? ? ? ? ? ? ???????????O??????????? - resume ???????????????????????????? - ??????????????????resume??????????C - ??? resume ???????????????????? - -EXAMPLE +EXAMPLES ????????????????? "data.0000.wav" ????L???? - - % adintool -in mic -out file -filename data - - ??????????? "foobar.raw"??????? ? "foobar.1500.wav" - "foobar.1501.wav" ... ?????? - - % adintool -in file -out file -filename foobar - -startid 1500 - (????????????????????) - enter filename->foobar.raw - + ??????????? "foobar.raw" ????????? + "foobar.1500.wav" "foobar.1501.wav" ... ?????? ????????????????????(??????? - - [???] - % adintool -in adinnet -out file -nosegment - [???] 
- % adintool -in file -out adinnet -server hostname - -nosegment - - ????????????????? Julius ???? - - (1) ????????????Julius??????E?ッ? - - [Julius] - % julius -C xxx.jconf ... -input adinnet - [adintool] - % adintool -in mic -out adinnet -server hostname - -nosegment - - (2) ????????????(adintool)???????C????????- ???Julius ?????ッ? - - [Julius] - % julius -C xxx.jconf ... -input adinnet - [adintool] - % adintool -in mic -out adinnet -server hostname + ??????????? Julius ??????ッ? SEE ALSO - julius(1), adinrec(1) - -BUGS - ??????????????? ? ? ? julius-info at lists.source- - forge.jp ????????? + julius ( 1 ) , + adinrec ( 1 ) COPYRIGHT - Copyright (c) 1991-2006 ???? ????コ - Copyright (c) 2000-2005 ?????????w??? ュ???コ - Copyright (c) 2005-2006 ??????? Julius????? + Copyright (c) 1991-2008 ???? ????コ + + Copyright (c) 1997-2000 ????U?????(IPA) + + Copyright (c) 2000-2008 ?????????w??? ュ???コ -AUTHORS - ? ?? (???????) ?タ?????? + Copyright (c) 2005-2008 ??????? Julius????? LICENSE Julius ??????????D -4.3 Berkeley Distribution LOCAL ADINTOOL(1) + 10/02/2008 ADINTOOL(1) Index: julius4/adintool/00readme.txt diff -u julius4/adintool/00readme.txt:1.2 julius4/adintool/00readme.txt:1.3 --- julius4/adintool/00readme.txt:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adintool/00readme.txt Thu Oct 2 17:23:45 2008 @@ -1,206 +1,214 @@ + adintool + ADINTOOL(1) ADINTOOL(1) NAME - adintool - audio tool to record/split/send/receive speech data for - Julius + adintool + - a tool to record / split / send / receive audio streams SYNOPSIS - adintool -in inputdev -out outputdev [options...] + adintool {-in inputdev} {-out outputdev} [options...] DESCRIPTION adintool analyzes speech input, finds speech segments skipping silence, - and records the detected segments in various ways. It performs speech - detection based on zerocross number and power (level), and records the + and records the detected segments in various ways. 
It performs speech + detection based on zerocross number and power (level), and records the detected parts to files or other output devices sucessively. - adintool is a highly-functioned version of adinrec. The supported - input device are: microphone input, a speech file, standard tty input, - and network socket (called adin-net server mode). The speech segments - are saved to output devices: speech files, standard tty output, and - network socket (called adin-net client mode). For example, you can - record the incoming speech segments to files with successively-numbered - suffixes, or send them to speech recognition engine julius to recognize - them. - - The output is not buffered: the receiver can get speech data with only - a slight delay after a speech starts. The speech detection algorithm - is as same as that of adinrec. - - Output format is WAV, 16bit (signed short), monoral. If the file - already exist, it will be overridden. - -INPUT - The input device should be specified by one of the following options: - - -in mic - Microphone input (default) - -in file - Speech data file. Supported format is RAW (16bit big endian) - and WAV (no compression) etc (depending on the compilation time - setting). - The input file name should be given later: prompt will appear - after startup. - - -in adinnet - Make adintool "adinnet server", waiting for connection from - adinnet client and receiving speech data from there via tcp/ip - socket. - Default port number is 5530, which can be altered by option - "-port". - - -in netaudio - If supported, get input data from NetAudio/Datlink server. Host - and unit name should be given with "-NA host:unit" option. - - -in stdin - Read speech data from standard tty input. Only RAW and WAV for- - mat is supported. - -OUTPUT - Specify one of these below to select an output device which the - detected speech segments are going to written to. - - -out file - Output to files. 
The base filename should be given by option - like "-filename foobar". Actually, the detected segments are - recorded in separate files such as "foobar.0000", "foobar.0001" - and so on. The four-digit ID begin with 0. This initial value - can be set explicitly by option "-startid". The output format - is WAV, 16bit signed. This can be changed by "-raw" option. - - -out adinnet - Make adintool "adinnet client", making connection to an adinnet - server on a host, and send speech data to the server. The host- - name should be specified by option "-server". The default port - number is 5530, which can be altered by option "-port". The - available adinnet server so far is adintool and Julius. + adintool is a upper version of adinrec with various functions. + Supported input device are: microphone input, a speech file, standard + tty input, and network socket (called adin-net server mode). Julius + plugin can be also used. Detected speech segments will be saved to + output devices: speech files, standard tty output, and network socket + (called adin-net client mode). For example, you can split the incoming + speech to segments and send them to Julius to be recognized. - -out stdout - Output to standard tty output in RAW, 16bit signed (big endian). + Output format is WAV, 16bit (signed short), monoral. If the file + already exist, it will be overridden. OPTIONS - -server host[,host...] - Server(s) to connect with "-out adinnet". With multiple server, - port number for each host should be specified by comma-separated - list. (default: 5530) - - -port num[,host...] - Port number to connect with "-out adinnet". Should be corre- - spond with "-server" - - -nosegment - Re-direct whole input speech data to output device, without - speech detection and segmentation. With this option, the output - filename does not have its four-digit ID appended. - - -oneshot - Record only the first speech segment. 
- - -freq threshold - Sampling frequency (Hz, default=16000) - - -48 Record in 48kHz, and down sampling to 16kHz. - - -lv threslevel - Level threshold (0-32767, default=2000) - - -zc zerocrossnum - Zero cross number threshold in a second (default=60) - - -headmargin msec - Header margin of each speech segment (unit: milliseconds) - (default: 400) - - -tailmargin msec - Tail margin of each speech segment (unit: milliseconds) - (default: 400) - - -nostrip - Disable skipping of invalid zero samples (default: enabled) - - -zmean Enable zero mean subtraction to remove DC offset. - - -raw Output in RAW (no header) 16bit, big engian format (default: - WAV) - - -autopause - Automatically pause at each input end. - - -loosesync - When connecting to multiple servers, avoid strict synchroniza- - tion for server-side pause and resume command. - - -rewind msec - By default, adintool will ignore speech input while being paused - by server-side command. This may be a problem if an input - begins while paused and then adintool resumes before the input - ends. This option will send the last msec inputs before resum- - ing. - -EXAMPLE - Record microphone input only for the speech-detected part in - "data.0000.wav", "data.0001.wav", ...: - - % adintool -in mic -out file -filename data - - Split a large speech data "foobar.raw" to "foobar.1500.wav", "foo- - bar.1501.wav", etc: - - % adintool -in file -out file -filename foobar - -startid 1500 - (enter the input filename after startup) - enter filename->foobar.raw - .... - - Send whole speech file to other host via tcp/ip socket: - - [sender] - % adintool -in adinnet -out file -nosegment - [receiver] - % adintool -in file -out adinnet -server hostname - -nosegment - - Send microphone input to Julius running on other host: - - (1) Transmit whole input, and let Julius execute - speech detection and recognition: - - [Julius] - % julius -C xxx.jconf ... 
-input adinnet - [adintool] - % adintool -in mic -out adinnet -server hostname - -nosegment - - (2) Detect speech segment at input client side - (adintool), and transmit only the detected parts - to Julius, and recognize them: - - [Julius] - % julius -C xxx.jconf ... -input adinnet - [adintool] - % adintool -in mic -out adinnet -server hostname + All Julius options can be set. Only audio input related options are + treated and others are silently skipped. Below is a list of options. + adintool specific options + -freq Hz + Set sampling rate in Hz. (default: 16,000) + + -in inputdev + Audio input device. "mic" to capture via microphone input, "file" + for audio file input, and "stdin" to read raw data from + standard-input. For file input, file name prompt will appear after + startup. Use "adinnet" to make adintool as "adinnet server", + receiving data from client via network socket. Default port number + is 5530, which can be altered by option "-inport". + + Alternatively, input device can be set by "-input" option, in which + case you can use plugin input. + + -out outputdev + Audio output device store the data. Specify "file" to save to file, + in which the output filename should be given by "-filename". Use + "stdout" to standard out. "adinnet" will make adintool to be an + adinnet client, sending speech data to a server via tcp/ip socket. + When using "adinnet" output, the server name to send data should be + specified by "-server". The default port number is 5530, which can + be changed by "-port" option. + + -inport num + When adintool becomes adinnet server to receive data (-in adinnet), + set the port number to listen. (default: 5530) + + -server [host] [,host...] + When output to adinnet server (-out adinnet), set the hostname. You + can send to multiple hosts by specifying their hostnames as + comma-delimited list like "host1,host2,host3". + + -port [num] [,num...] 
+ When adintool send a data to adinnet server (-out adinnet), set the + port number to connect. (default: 5530) For multiple servers, + specify port numbers for all servers like "5530,5530,5531". + + -filename file + When output to file (-out file), set the output filename. The actual + file name will be as "file.0000.wav" , "file.0001.wav" and so on, + where the four digit number increases as speech segment detected. + The initial number will be set to 0 by default, which can be changed + by "-startid" option. When using "-oneshot" option to save only the + first segment, the input will be saved as "file". + + -startid number + At file output, set the initial file number. (default: 0) + + -oneshot + Exit after the end of first speech segment. + + -nosegment + Do not perform speech detection for input, just treat all the input + as a single valid segment. + + -raw + Output as RAW file (no header). + + -autopause + When output to adinnet server, adintool enter pause state at every + end of speech segment. It will restart when the destination adinnet + server sends it a resume signal. + + -loosesync + When output to multiple adinnet server, not to do strict + synchronization for restart. By default, when adintool has entered + pause state, it will not restart until resume commands are received + from all servers. This option will allow restart at least one + restart command has arrived. + + -rewind msec + When input is a live microphone device, and there has been some + continuing input at the moment adintool resumes, it start recording + backtracking by the specified milliseconds. + + Concerning Julius options + -input {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} + Choose speech input source. Specify 'file' or 'rawfile' for waveform + file. On file input, users will be prompted to enter the file name + from stdin. 
+ + 'mic' is to get audio input from a default live microphone device, + and 'adinnet' means receiving waveform data via tcpip network from + an adinnet client. 'netaudio' is from DatLink/NetAudio input, and + 'stdin' means data input from standard input. + + At Linux, you can choose API at run time by specifying alsa, oss and + esd. + + -lv thres + Level threshold for speech input detection. Values should be in + range from 0 to 32767. (default: 2000) + + -zc thres + Zero crossing threshold per second. Only input that goes over the + level threshold (-lv) will be counted. (default: 60) + + -headmargin msec + Silence margin at the start of speech segment in milliseconds. + (default: 300) + + -tailmargin msec + Silence margin at the end of speech segment in milliseconds. + (default: 400) + + -zmean + This option enables DC offset removal. + + -smpFreq Hz + Set sampling rate in Hz. (default: 16,000) + + -48 + Record input with 48kHz sampling, and down-sample it to 16kHz + on-the-fly. This option is valid for 16kHz model only. The + down-sampling routine was ported from sptk. (Rev. 4.0) + + -NA devicename + Host name for DatLink server input (-input netaudio). + + -adport port_number + With -input adinnet, specify adinnet port number to listen. + (default: 5530) + + -nostrip + Julius by default removes successive zero samples in input speech + data. This option stop it. + + -C jconffile + Load a jconf file at here. The content of the jconffile will be + expanded at this point. + + -plugindir dirlist + Specify which directories to load plugin. If several direcotries + exist, specify them by colon-separated list. + +ENVIRONMENT VARIABLES + ALSADEV + (using mic input with alsa device) specify a capture device name. If + not specified, "default" will be used. + + AUDIODEV + (using mic input with oss device) specify a capture device path. If + not specified, "/dev/dsp" will be used. + + LATENCY_MSEC + Try to set input latency of microphone input in milliseconds. 
+ Smaller value will shorten latency but sometimes make process + unstable. Default value will depend on the running OS. + +EXAMPLES + Record microphone input to files: "data.0000.wav", "data.0001.wav" and + so on: + Split a long speech file "foobar.raw" into "foobar.1500.wav", + "foobar.1501.wav" ...: + Copy an entire audio file via network socket. + Detect speech segment, send to Julius via network and recognize it: SEE ALSO - julius(1), adinrec(1) + julius ( 1 ) , + adinrec ( 1 ) COPYRIGHT - Copyright (c) 1991-2007 Kawahara Lab., Kyoto University - Copyright (c) 2001-2007 Shikano Lab., Nara Institute of Science and + Copyright (c) 1997-2000 Information-technology Promotion Agency, Japan + + Copyright (c) 1991-2008 Kawahara Lab., Kyoto University + + Copyright (c) 2000-2005 Shikano Lab., Nara Institute of Science and Technology - Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Tech- - nology -AUTHORS - LEE Akinobu (Nagoya Institute of Technology, Japan) - contact: julius-info at lists.sourceforge.jp + Copyright (c) 2005-2008 Julius project team, Nagoya Institute of + Technology LICENSE - Same as Julius. + The same as Julius. -4.3 Berkeley Distribution LOCAL ADINTOOL(1) + 10/02/2008 ADINTOOL(1) Index: julius4/adintool/adintool.man diff -u julius4/adintool/adintool.man:1.2 julius4/adintool/adintool.man:removed --- julius4/adintool/adintool.man:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adintool/adintool.man Thu Oct 2 17:23:45 2008 @@ -1,193 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH ADINTOOL 1 LOCAL -.UC 6 -.SH NAME -adintool - audio tool to record/split/send/receive speech data for Julius -.SH SYNOPSIS -.B adintool -in inputdev -out outputdev [options...] -.SH DESCRIPTION -.I adintool -analyzes speech input, finds speech segments skipping silence, and -records the detected segments in various ways. 
It performs speech -detection based on zerocross number and power (level), and records the -detected parts to files or other output devices sucessively. -.PP -.I adintool -is a highly-functioned version of -.I adinrec. -The supported input device are: microphone input, a speech file, -standard tty input, and network socket (called adin-net server mode). -The speech segments are saved to output devices: speech files, -standard tty output, and network socket (called adin-net client mode). -For example, you can record the incoming speech segments to files with -successively-numbered suffixes, or send them to speech recognition -engine -.I julius -to recognize them. -.PP -The output is not buffered: the receiver can get speech data with only -a slight delay after a speech starts. The speech detection algorithm -is as same as that of -.I adinrec. -.PP -Output format is WAV, 16bit (signed short), monoral. -If the file already exist, it will be overridden. -.SH INPUT -The input device should be specified by one of the following options: -.Ip "\-in mic" -Microphone input (default) -.Ip "\-in file" -Speech data file. Supported format is RAW (16bit big endian) and WAV -(no compression) etc (depending on the compilation time setting). -.br -The input file name should be given later: prompt will appear after startup. -.Ip "\-in adinnet" -Make -.I adintool -"adinnet server", waiting for connection from adinnet client and -receiving speech data from there via tcp/ip socket. -.br -Default port number is 5530, which can be altered by option "-port". -.Ip "\-in netaudio" -If supported, get input data from NetAudio/Datlink server. Host and -unit name should be given with "-NA host:unit" option. -.Ip "\-in stdin" -Read speech data from standard tty input. Only RAW and WAV format is -supported. -.SH OUTPUT -Specify one of these below to select an output device which the detected -speech segments are going to written to. -.Ip "\-out file" -Output to files. 
The base filename should be given by option like -"-filename foobar". Actually, the detected segments are recorded in -separate files such as "foobar.0000", "foobar.0001" and so on. The -four-digit ID begin with 0. This initial value can be set explicitly -by option "-startid". The output format is WAV, 16bit signed. This -can be changed by "-raw" option. -.Ip "\-out adinnet" -Make -.I adintool -"adinnet client", making connection to an adinnet server on a host, -and send speech data to the server. The hostname should be specified -by option "-server". The default port number is 5530, which can be -altered by option "-port". -The available adinnet server so far is -.I adintool -and -.I Julius. -.Ip "\-out stdout" -Output to standard tty output in RAW, 16bit signed (big endian). -.SH OPTIONS -.Ip "\-server host[,host...]" -Server(s) to connect with "-out adinnet". With multiple server, port -number for each host should be specified by comma-separated -list. (default: 5530) -.Ip "\-port num[,host...]" -Port number to connect with "-out adinnet". Should be correspond with "-server" -.Ip "\-nosegment" -Re-direct whole input speech data to output device, without speech -detection and segmentation. With this option, the output filename -does not have its four-digit ID appended. -.Ip "\-oneshot" -Record only the first speech segment. -.Ip "\-freq threshold" -Sampling frequency (Hz, default=16000) -.Ip "\-48" -Record in 48kHz, and down sampling to 16kHz. -.Ip "\-lv threslevel" -Level threshold (0-32767, default=2000) -.Ip "\-zc zerocrossnum" -Zero cross number threshold in a second (default=60) -.Ip "\-headmargin msec" -Header margin of each speech segment (unit: milliseconds) -(default: 400) -.Ip "\-tailmargin msec" -Tail margin of each speech segment (unit: milliseconds) -(default: 400) -.Ip "\-nostrip" -Disable skipping of invalid zero samples (default: enabled) -.Ip "\-zmean" -Enable zero mean subtraction to remove DC offset. 
-.Ip "\-raw" -Output in RAW (no header) 16bit, big engian format (default: WAV) -.Ip "\-autopause" -Automatically pause at each input end. -.Ip "\-loosesync" -When connecting to multiple servers, avoid strict synchronization -for server-side pause and resume command. -.Ip "\-rewind msec" -By default, adintool will ignore speech input while being paused by -server-side command. This may be a problem if an input begins while -paused and then adintool resumes before the input ends. This option -will send the last msec inputs before resuming. -.SH "EXAMPLE" -Record microphone input only for the speech-detected part in -"data.0000.wav", "data.0001.wav", ...: -.PP - % adintool -in mic -out file -filename data -.PP -Split a large speech data "foobar.raw" to "foobar.1500.wav", "foobar.1501.wav", etc: -.PP - % adintool -in file -out file -filename foobar - -startid 1500 - (enter the input filename after startup) - enter filename->foobar.raw - .... -.PP -Send whole speech file to other host via tcp/ip socket: -.PP - [sender] - % adintool -in adinnet -out file -nosegment -.BR - [receiver] - % adintool -in file -out adinnet -server hostname - -nosegment -.PP -Send microphone input to -.I Julius -running on other host: -.PP -(1) Transmit whole input, and let Julius execute - speech detection and recognition: -.PP - [Julius] - % julius -C xxx.jconf ... -input adinnet -.BR - [adintool] - % adintool -in mic -out adinnet -server hostname - -nosegment -.PP -(2) Detect speech segment at input client side - (adintool), and transmit only the detected parts - to Julius, and recognize them: -.PP - [Julius] - % julius -C xxx.jconf ... 
-input adinnet -.BR - [adintool] - % adintool -in mic -out adinnet -server hostname - -.SH "SEE ALSO" -julius(1), adinrec(1) -.SH COPYRIGHT -Copyright (c) 1991-2007 Kawahara Lab., Kyoto University -.br -Copyright (c) 2001-2007 Shikano Lab., Nara Institute of Science and Technology -.br -Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology -.SH AUTHORS -LEE Akinobu (Nagoya Institute of Technology, Japan) -.br -contact: julius-info at lists.sourceforge.jp -.SH LICENSE -Same as -.I Julius. Index: julius4/adintool/adintool.man.ja diff -u julius4/adintool/adintool.man.ja:1.2 julius4/adintool/adintool.man.ja:removed --- julius4/adintool/adintool.man.ja:1.2 Tue Dec 18 23:08:21 2007 +++ julius4/adintool/adintool.man.ja Thu Oct 2 17:23:45 2008 @@ -1,193 +0,0 @@ -.de Sp -.if t .sp .5v -.if n .sp -.. -.de Ip -.br -.ie \\n.$>=3 .ne \\$3 -.el .ne 3 -.IP "\\$1" \\$2 -.. -.TH ADINTOOL 1 LOCAL -.UC 6 -.SH NAME -adintool - audio tool to record/split/send/receive speech data for Julius -.SH SYNOPSIS -.B adintool -in inputdev -out outputdev [options...] -.SH DESCRIPTION -.I adintool -は,音声波形データ中の音声区間の検出および記録を連続的に行うツールです. -入力音声に対して零交差数と振幅レベルに基づく音声区間検出を逐次行い, -音声区間部分を連続出力します. -.PP -.I adintool -は -.I adinrec -の高機能版です.音声データの入力元として,マイク入力・音声波形ファイル・ -標準入力・ネットワーク入力(adinnet サーバーモード)が選択できます.また, -出力先として,音声波形ファイル・標準出力・ネットワーク出力(adinnet ク -ライアントモード)が選択できます.特にネットワーク出力(adinnet クライ -アントモード)では, -.I julius -へネットワーク経由で音声を送信して音声認識させることができます. -.PP -入力音声は音声区間ごとに自動分割され,逐次出力されます. -音声区間の切り出しには -.I adinrec -と同じ,一定時間内の零交差数とパワー(振幅レベル)のしきい値を用います. -音声区間開始と同時に音声出力が開始されます.出力としてファイル出力を選 -んだ場合は,連番ファイル名で検出された区間ごとに保存します. -.PP -サンプリング周波数は任意に設定可能です.形式は 16bit monoral です.書き出されるデータ形式は WAV, 16bit, モノラルです. -既に同じ名前のファイルが存在する場合は上書きします. -.SH INPUT -音声を読み込む入力デバイスは以下のうちどれかを指定します. -.Ip "\-in mic" -マイク入力(デフォルト). -.Ip "\-in file" -音声波形ファイル.形式は RAW (16bit big endian),WAV(無圧縮)など -(コンパイル時の設定による). -.br -なお,入力ファイル名は起動後に,プロンプトに対して入力する. -.Ip "\-in adinnet" -adinnet サーバーとなってネットワーク経由で adinnet クライアントから音声データを受け取る. 
-adinnet クライアントからのTCP/IP接続を待ち, -接続が確立した後は adinnet クライアントから音声データを受け取る. -.br -ポート番号のデフォルトは 5530 である.これはオプション "-port" で変更可能. -.Ip "\-in netaudio" -(サポートされていれば)音声データをNetaudio/DatLinkサーバーから受け取 -る.サーバのホスト名とユニット名を "-NA host:unit" で指定する必要があ -る. -.Ip "\-in stdin" -標準入力.音声データ形式は RAW, WAV のみ. -.SH OUTPUT -検出した音声区間の音声データを書き出す出力デバイスとして,以下のうちど -れかを指定します. -.Ip "\-out file" -ファイルへ出力する.出力ファイル名は別のオプション"-filename foobar" -の形で与える.実際には "foobar.0000" , "foobar.0001" ... のように区間ごとに,指 -定した名前の末尾に4桁のIDをつけた名前で記録されなる. ID は 0 -を初期値として,音声区間検出ごとに1増加する.初期値はオプション -"-startid" で変更可能である.また,出力ファイル形式は 16bit WAV 形式である. -RAW 形式で出力するには "-raw" オプションを指定する. -.Ip "\-out adinnet" -adinnet クライアントとなって,ネットワーク経由で adinnet サーバへ音声 -データを送る.入力の時とは逆に, -.I adintool -は adinnet クライアントとなり,adinnet サーバーへ接続後,音声データを -送信する.adinnet サーバーとしては, -.I adintool -および -.I Julius -のadinnet入力が挙げられる. -.br -"-server" で送信先のadinnetサーバのホスト名を指定する.また -ポート番号のデフォルトは 5530 である.これはオプション "-port" で変更可能. -.Ip "\-out stdout" -標準出力へ出力する.形式は RAW, 16bit signed (big endian) である. -.PP -.SH OPTIONS -.Ip "\-server host[,host...]" -"-out adinnet" で送信するサーバのホスト名を指定する.コンマ区切りで -複数のサーバを指定可能. -.Ip "\-port num[,host...]" -"-out adinnet" で送信するサーバのポート番号.複数サーバ使用時は -コンマ区切りで "-server"に対応させて全ての番号を指定すること. (default: 5530) -.Ip "\-nosegment" -入力音声に対して音声区間の検出を行わず,そのまま出力へリダイレクトする. -ファイル出力の場合,ファイル名の末尾に4桁のIDは付与されなくなる. -.Ip "\-oneshot" -入力開始後,一番最初の1音声区間のみを送信後,終了する. -.Ip "\-freq threshold" -サンプリング周波数.単位は Hz (default: 16000) -.Ip "\-48" -48kHzサンプリング後,16kHzにダウンサンプリングする. -.Ip "\-lv threslevel" -波形の振幅レベルのしきい値 (0 - 32767).(default: 2000). -.Ip "\-zc zerocrossnum" -1秒あたりの零交差数のしきい値 (default: 60) -.Ip "\-headmargin msec" -音声区間開始部の直前のマージン.単位はミリ秒 -(default: 400) -.Ip "\-tailmargin msec" -音声区間終了部の直後のマージン.単位はミリ秒 -(default: 400) -.Ip "\-nostrip" -無効な 0 サンプルの自動除去を行わないようにする. -デフォルトは自動除去を行う. -.Ip "\-zmean" -DC成分除去を行う. -.Ip "\-raw" -ファイル出力形式を RAW, 16bit signed (big endian) にする. -デフォルトは WAV 形式である. -.Ip "\-autopause" -入力終了ごとに自動的に pause 状態に入る. 
-.Ip "\-loosesync" -複数サーバ接続時,複数サーバからの pause や resume コマンドに対して -厳密な同期を行わないようにする. -.Ip "\-rewind msec" -通常,adintool は pause 中の入力を無視する.このため,pause中に入力が開始 -され,その入力が終了する前にサーバコマンドにより resume したときに -極端に短い音声フラグメントが検出されることとなる.このオプションを -指定することで,resume時に音声入力中の場合,入力を resume 時点から -指定した長さだけ遡って送信する. -.SH "EXAMPLE" -マイクからの音声入力を,発話ごとに "data.0000.wav" から順に記録する: -.PP - % adintool -in mic -out file -filename data -.PP -巨大な収録音声ファイル "foobar.raw"を音声区間ごとに -"foobar.1500.wav" "foobar.1501.wav" ... に分割する: -.PP - % adintool -in file -out file -filename foobar - -startid 1500 - (起動後プロンプトに対してファイル名を入力) - enter filename->foobar.raw -.PP -ネットワーク経由で音声ファイルを転送する(区間検出なし): -.PP - [受信側] - % adintool -in adinnet -out file -nosegment -.BR - [送信側] - % adintool -in file -out adinnet -server hostname - -nosegment -.PP -マイクからの入力音声を別サーバーの -.I Julius -に送る: -.PP -(1) 入力データを全て送信し,Julius側で区間検出・認識: -.PP - [Julius] - % julius -C xxx.jconf ... -input adinnet -.BR - [adintool] - % adintool -in mic -out adinnet -server hostname - -nosegment -.PP -(2) 入力データはクライアント(adintool)側で区間検出し,検出した区間だけ -を順に Julius へ送信・認識: -.PP - [Julius] - % julius -C xxx.jconf ... -input adinnet -.BR - [adintool] - % adintool -in mic -out adinnet -server hostname -.SH "SEE ALSO" -julius(1), adinrec(1) -.SH BUGS -バグ報告・問い合わせ・コメントなどは -julius-info at lists.sourceforge.jp までお願いします. -.SH COPYRIGHT -Copyright (c) 1991-2006 京都大学 河原研究室 -.br -Copyright (c) 2000-2005 奈良先端科学技術大学院大学 鹿野研究室 -.br -Copyright (c) 2005-2006 名古屋工業大学 Julius開発チーム -.SH AUTHORS -李 晃伸 (名古屋工業大学) が実装しました. -.SH LICENSE -.I Julius -の使用許諾に準じます. 
From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:48 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:48 +0900 Subject: [Julius-cvs 312] CVS update: julius4/man Message-ID: <1222935828.292011.32396.nullmailer@users.sourceforge.jp> Index: julius4/man/accept_check.1 diff -u /dev/null julius4/man/accept_check.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/accept_check.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,96 @@ +.\" Title: + accept_check + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ACCEPT_CHECK" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + accept_check + \- Check whether a grammar accepts / rejects given word sequences +.SH "SYNOPSIS" +.HP 13 +\fBaccept_check\fR [\-t] [\-s\ \fIspname\fR] [\-v] {prefix} +.SH "DESCRIPTION" +.PP + +\fBaccept_check\fR +is a tool to check whether a sentence is accepted or rejected by a grammar (\fIprefix.dfa\fR +and +\fIprefix.dict\fR). The sentence should be given from standard input. You can do a batch check by preparing a text file with one test sentence per line and giving it as the standard input of +\fBaccept_check\fR. +.PP +This tool needs .dfa, .dict and .term files. You should convert a written grammar file to generate them by +\fBmkdfa.pl\fR. +.PP +A sentence should be given as a space\-separated word sequence. It may be required to add a head / tail silence word like +sil, depending on your grammar. The sentence should not contain a short\-pause word. +.PP +When a word belongs to several categories in a grammar, +\fBaccept_check\fR +will check all the possible sentence patterns, and accept it if any of those is acceptable. +.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +Use category name as input instead of word. +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +Short\-pause word name to be skipped.
(default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +Debug output. +.RE +.SH "EXAMPLES" +.PP +An output for "date" grammar: +.sp +.RS 3n +.nf +% echo ' NEXT SUNDAY ' | accept_check date +Reading in dictionary... +143 words...done +Reading in DFA grammar...done +Mapping dict item <\-> DFA terminal (category)...done +Reading in term file (optional)...done +27 categories, 143 words +DFA has 35 nodes and 71 arcs +\-\-\-\-\- +wseq: NEXT SUNDAY +cate: NS_B (NEXT|NEXT) (DAYOFWEEK|DAYOFWEEK|DAY|DAY) NS_E +accepted +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB nextword \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/adinrec.1 diff -u /dev/null julius4/man/adinrec.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/adinrec.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,156 @@ +.\" Title: + adinrec + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ADINREC" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + adinrec + \- record audio device and save one utterance to a file +.SH "SYNOPSIS" +.HP 8 +\fBadinrec\fR [\fIoptions\fR...] {\fIfilename\fR} +.SH "DESCRIPTION" +.PP + +\fBadinrec\fR +opens an audio stream, detects an utterance input and store it to a specified file. The utterance detection is done by level and zero\-cross thresholds. Default input device is microphone, but other audio input source, including Julius A/D\-in plugin, can be used by using "\fB\-input\fR" option. 
+.PP +The audio format is 16 bit, 1 channel, in Microsoft WAV format. If the given filename already exists, it will be overridden. +.PP +If filename is "\-" , the captured data will be streamed into standard out, with no header (raw format). +.SH "OPTIONS" +.PP + +\fBadinrec\fR +uses JuliusLib and adopts Julius options. Below is a list of valid options. +.SS "adinrec specific options" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +Set sampling rate in Hz. (default: 16,000) +.RE +.PP +\fB \-raw \fR +.RS 3n +Output in raw file format. +.RE +.SS "JuliusLib options" +.PP +\fB \-input \fR {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} +.RS 3n +Choose speech input source. Specify 'file' or 'rawfile' for waveform file. On file input, users will be prompted to enter the file name from stdin. +.sp +\'mic' is to get audio input from a default live microphone device, and 'adinnet' means receiving waveform data via tcpip network from an adinnet client. 'netaudio' is from DatLink/NetAudio input, and 'stdin' means data input from standard input. +.sp +At Linux, you can choose API at run time by specifying +alsa, +oss +and +esd. +.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +Level threshold for speech input detection. Values should be in range from 0 to 32767. (default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +Zero crossing threshold per second. Only input that goes over the level threshold (\fB\-lv\fR) will be counted. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +Silence margin at the start of speech segment in milliseconds. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +Silence margin at the end of speech segment in milliseconds. (default: 400) +.RE +.PP +\fB \-zmean \fR +.RS 3n +This option enables DC offset removal. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +Set sampling rate in Hz. (default: 16,000) +.RE +.PP +\fB \-48 \fR +.RS 3n +Record input with 48kHz sampling, and down\-sample it to 16kHz on\-the\-fly. 
This option is valid for 16kHz model only. The down\-sampling routine was ported from +sptk. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +Host name for DatLink server input (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n +With +\fB\-input adinnet\fR, specify adinnet port number to listen. (default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +Julius by default removes successive zero samples in input speech data. This option stops it. +.RE +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +Load a jconf file here. The content of the jconffile will be expanded at this point. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +Specify the directories from which to load plugins. If several directories exist, specify them as a colon\-separated list. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +Device name string for ALSA. (default: "default") +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +Device name string for OSS. (default: "\fI/dev/dsp\fR") +.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Input latency of microphone input in milliseconds. Smaller value will shorten latency but sometimes make process unstable. Default value will depend on the running OS. +.RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB adintool \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius.
Index: julius4/man/adintool.1 diff -u /dev/null julius4/man/adintool.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/adintool.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,238 @@ +.\" Title: + adintool + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ADINTOOL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + adintool + \- a tool to record / split / send / receive audio streams +.SH "SYNOPSIS" +.HP 9 +\fBadintool\fR {\-in\ \fIinputdev\fR} {\-out\ \fIoutputdev\fR} [\fIoptions\fR...] +.SH "DESCRIPTION" +.PP + +\fBadintool\fR +analyzes speech input, finds speech segments skipping silence, and records the detected segments in various ways. It performs speech detection based on zerocross number and power (level), and records the detected parts to files or other output devices successively. +.PP + +\fBadintool\fR +is an enhanced version of adinrec with various functions. Supported input devices are: microphone input, a speech file, standard tty input, and network socket (called adin\-net server mode). Julius plugin can be also used. Detected speech segments will be saved to output devices: speech files, standard tty output, and network socket (called adin\-net client mode). For example, you can split the incoming speech to segments and send them to Julius to be recognized. +.PP +Output format is WAV, 16bit (signed short), monaural. If the file already exists, it will be overwritten. +.SH "OPTIONS" +.PP +All Julius options can be set. Only audio input related options are treated and others are silently skipped. Below is a list of options. +.SS "adintool specific options" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +Set sampling rate in Hz. (default: 16,000) +.RE +.PP +\fB \-in \fR \fIinputdev\fR +.RS 3n +Audio input device.
"mic" to capture via microphone input, "file" for audio file input, and "stdin" to read raw data from standard\-input. For file input, file name prompt will appear after startup. Use "adinnet" to make +\fBadintool\fR +as "adinnet server", receiving data from client via network socket. Default port number is 5530, which can be altered by option "\fB\-inport\fR". +.sp +Alternatively, input device can be set by "\fB\-input\fR" option, in which case you can use plugin input. +.RE +.PP +\fB \-out \fR \fIoutputdev\fR +.RS 3n +Audio output device store the data. Specify "file" to save to file, in which the output filename should be given by "\fB\-filename\fR". Use "stdout" to standard out. "adinnet" will make +\fBadintool\fR +to be an adinnet client, sending speech data to a server via tcp/ip socket. When using "adinnet" output, the server name to send data should be specified by "\fB\-server\fR". The default port number is 5530, which can be changed by "\fB\-port\fR" option. +.RE +.PP +\fB \-inport \fR \fInum\fR +.RS 3n +When adintool becomes adinnet server to receive data (\-in adinnet), set the port number to listen. (default: 5530) +.RE +.PP +\fB \-server \fR [host] [,host...] +.RS 3n +When output to adinnet server (\-out adinnet), set the hostname. You can send to multiple hosts by specifying their hostnames as comma\-delimited list like "host1,host2,host3". +.RE +.PP +\fB \-port \fR [num] [,num...] +.RS 3n +When adintool send a data to adinnet server (\-out adinnet), set the port number to connect. (default: 5530) For multiple servers, specify port numbers for all servers like "5530,5530,5531". +.RE +.PP +\fB \-filename \fR \fIfile\fR +.RS 3n +When output to file (\fB\-out file\fR), set the output filename. The actual file name will be as "\fIfile.0000.wav\fR" , "\fIfile.0001.wav\fR" and so on, where the four digit number increases as speech segment detected. The initial number will be set to 0 by default, which can be changed by "\fB\-startid\fR" option. 
When using "\fB\-oneshot\fR" option to save only the first segment, the input will be saved as "\fIfile\fR". +.RE +.PP +\fB \-startid \fR \fInumber\fR +.RS 3n +At file output, set the initial file number. (default: 0) +.RE +.PP +\fB \-oneshot \fR +.RS 3n +Exit after the end of first speech segment. +.RE +.PP +\fB \-nosegment \fR +.RS 3n +Do not perform speech detection for input, just treat all the input as a single valid segment. +.RE +.PP +\fB \-raw \fR +.RS 3n +Output as RAW file (no header). +.RE +.PP +\fB \-autopause \fR +.RS 3n +When output to adinnet server, +\fBadintool\fR +enter pause state at every end of speech segment. It will restart when the destination adinnet server sends it a resume signal. +.RE +.PP +\fB \-loosesync \fR +.RS 3n +When output to multiple adinnet server, not to do strict synchronization for restart. By default, when +\fBadintool\fR +has entered pause state, it will not restart until resume commands are received from all servers. This option will allow restart at least one restart command has arrived. +.RE +.PP +\fB \-rewind \fR \fImsec\fR +.RS 3n +When input is a live microphone device, and there has been some continuing input at the moment +\fBadintool\fR +resumes, it start recording backtracking by the specified milliseconds. +.RE +.SS "Concerning Julius options" +.PP +\fB \-input \fR {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} +.RS 3n +Choose speech input source. Specify 'file' or 'rawfile' for waveform file. On file input, users will be prompted to enter the file name from stdin. +.sp +\'mic' is to get audio input from a default live microphone device, and 'adinnet' means receiving waveform data via tcpip network from an adinnet client. 'netaudio' is from DatLink/NetAudio input, and 'stdin' means data input from standard input. +.sp +At Linux, you can choose API at run time by specifying +alsa, +oss +and +esd. +.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +Level threshold for speech input detection. 
Values should be in range from 0 to 32767. (default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +Zero crossing threshold per second. Only input that goes over the level threshold (\fB\-lv\fR) will be counted. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +Silence margin at the start of speech segment in milliseconds. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +Silence margin at the end of speech segment in milliseconds. (default: 400) +.RE +.PP +\fB \-zmean \fR +.RS 3n +This option enables DC offset removal. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +Set sampling rate in Hz. (default: 16,000) +.RE +.PP +\fB \-48 \fR +.RS 3n +Record input with 48kHz sampling, and down\-sample it to 16kHz on\-the\-fly. This option is valid for 16kHz model only. The down\-sampling routine was ported from +sptk. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +Host name for DatLink server input (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n +With +\fB\-input adinnet\fR, specify adinnet port number to listen. (default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +Julius by default removes successive zero samples in input speech data. This option stop it. +.RE +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +Load a jconf file at here. The content of the jconffile will be expanded at this point. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +Specify which directories to load plugin. If several direcotries exist, specify them by colon\-separated list. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(using mic input with alsa device) specify a capture device name. If not specified, "default" will be used. +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(using mic input with oss device) specify a capture device path. If not specified, "\fI/dev/dsp\fR" will be used. 
+.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Try to set input latency of microphone input in milliseconds. Smaller value will shorten latency but sometimes make process unstable. Default value will depend on the running OS. +.RE +.SH "EXAMPLES" +.PP +Record microphone input to files: "\fIdata.0000.wav\fR", "\fIdata.0001.wav\fR" and so on: +.sp .RS 3n .nf % \fBadintool\fR \-in mic \-out file \-filename data .fi .RE +Split a long speech file "\fIfoobar.raw\fR" into "\fIfoobar.1500.wav\fR", "\fIfoobar.1501.wav\fR" ...: +.sp .RS 3n .nf % \fBadintool\fR \-in file \-out file \-filename foobar \-startid 1500 % enter filename\->foobar.raw .fi .RE +Copy an entire audio file via network socket. +.sp .RS 3n .nf (sender) % \fBadintool\fR \-in file \-out adinnet \-server \fIreceiver_hostname\fR \-nosegment (receiver) % \fBadintool\fR \-in adinnet \-out file \-nosegment .fi .RE +Detect speech segment, send to Julius via network and recognize it: +.sp .RS 3n .nf (sender) % \fBadintool\fR \-in mic \-out adinnet \-server \fIreceiver_hostname\fR (receiver) % \fBjulius\fR \-C ... \-input adinnet .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB adinrec \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. 
Index: julius4/man/dfa_determinize.1 diff -u /dev/null julius4/man/dfa_determinize.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/dfa_determinize.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,63 @@ +.\" Title: + dfa_determinize + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "DFA_DETERMINIZE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + dfa_determinize + \- Determinize NFA grammar network. +.SH "SYNOPSIS" +.HP 16 +\fBdfa_determinize\fR [\-o\ \fIoutfile\fR] {dfafile} +.SH "DESCRIPTION" +.PP + +\fBdfa_determinize\fR +converts a non\-deterministic .dfa file into a deterministic DFA. Output to standard output, or to a file specified by "\fB\-o\fR" option. +.PP +This additional tool is not necessary in the grammar building procedure of Julius, since the grammar network generated by +\fBmkdfa.pl\fR +is always determinized. +.SH "OPTIONS" +.PP +\fB \-o \fR \fIoutfile\fR +.RS 3n +Output file. If not specified, output to stdout. +.RE +.SH "EXAMPLES" +.PP +Determinize +\fIfoo.dfa\fR +to +\fIbar.dfa\fR: +.sp .RS 3n .nf % \fBdfa_determinize\fR \-o bar.dfa foo.dfa .fi .RE +Another way: +.sp .RS 3n .nf % \fBdfa_determinize\fR < foo.dfa > bar.dfa .fi .RE +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB dfa_minimize \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius.
Index: julius4/man/dfa_minimize.1 diff -u /dev/null julius4/man/dfa_minimize.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/dfa_minimize.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,61 @@ +.\" Title: + dfa_minimize + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "DFA_MINIMIZE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + dfa_minimize + \- Minimize a DFA grammar network +.SH "SYNOPSIS" +.HP 13 +\fBdfa_minimize\fR [\-o\ \fIoutfile\fR] {dfafile} +.SH "DESCRIPTION" +.PP + +\fBdfa_minimize\fR +will convert an .dfa file to an equivalent minimal form. Output to standard output, or to a file specified by "\fB\-o\fR" option. +.PP +On version 3.5.3 and later, +\fBmkdfa.pl\fR +invokes this tool inside, and the output .dfa file will be always minimized, so you do not need to use this manually. +.SH "OPTIONS" +.PP +\fB \-o \fR \fIoutfile\fR +.RS 3n +Output file. If not specified output to standard output. +.RE +.SH "EXAMPLES" +.PP +Minimize +\fIfoo.dfa\fR +to +\fIbar.dfa\fR: +.sp .RS 3n .nf % \fBdfa_minimize\fR \-o bar.dfa foo.dfa .fi .RE +Another way: +.sp .RS 3n .nf % \fBdfa_minimize\fR < foo.dfa > bar.dfa .fi .RE +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. 
Index: julius4/man/generate-ngram.1 diff -u /dev/null julius4/man/generate-ngram.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/generate-ngram.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,82 @@ +.\" Title: + generate\-ngram + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GENERATE\-NGRAM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + generate\-ngram + \- random sentence generator from N\-gram +.SH "SYNOPSIS" +.HP 15 +\fBgenerate\-ngram\fR [\fIoptions\fR...] {\fIbinary_ngram\fR} +.SH "DESCRIPTION" +.PP + +\fBgenerate\-ngram\fR +is a tool to generate sentences randomly according to the given N\-gram language model. The N\-gram model file +\fIbinary_ngram\fR +should be an binary format. +.SH "OPTIONS" +.PP +\fB \-n \fR \fInum\fR +.RS 3n +Number of sentences to generate (default: 10) +.RE +.PP +\fB \-N \fR +.RS 3n +Specify which length of N\-gram to use (default: available max in the given model) +.RE +.PP +\fB \-bos \fR +.RS 3n +Beginning\-of\-sentence word (default: "") +.RE +.PP +\fB \-eos \fR +.RS 3n +End\-of\-sentence word (default: "") +.RE +.PP +\fB \-ignore \fR +.RS 3n +Specify a word to be supressed from output (default: " +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GENERATE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + generate + \- random sentence generator from a grammar +.SH "SYNOPSIS" +.HP 9 +\fBgenerate\fR [\-v] [\-t] [\-n\ \fInum\fR] [\-s\ \fIspname\fR] {prefix} +.SH "DESCRIPTION" +.PP +This small program randomly generates sentences that are acceptable by the given grammar. +.PP + +\fI.dfa\fR, +\fI.dict\fR +and +\fI.term\fR +files are needed to execute. They can be generated from +\fI.grammar\fR +and +\fI.voca\fR +file by +\fBmkdfa.pl\fR. 
+.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +Output in word's category name. +.RE +.PP +\fB \-n \fR \fInum\fR +.RS 3n +Set number of sentences to be generated (default: 10) +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +Name string of the short\-pause word to be suppressed (default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +Debug output mode. +.RE +.SH "EXAMPLES" +.PP +Example output of a sample grammar "fruit": +.sp +.RS 3n +.nf +% \fBgenerate\fR fruit +Stat: init_voca: read 36 words +Reading in term file (optional)...done +15 categories, 36 words +DFA has 26 nodes and 42 arcs +\-\-\-\-\- + I WANT ONE APPLE + I WANT TEN PEARS + CAN I HAVE A PINEAPPLE + I WANT ONE PEAR + COULD I HAVE A BANANA + I WANT ONE APPLE PLEASE + I WANT NINE APPLES + NINE APPLES + I WANT ONE PINEAPPLE + I WANT A PEAR +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate\-ngram \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/gram2sapixml.pl.1 diff -u /dev/null julius4/man/gram2sapixml.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/gram2sapixml.pl.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,54 @@ +.\" Title: + gram2sapixml.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GRAM2SAPIXML.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + gram2sapixml.pl + \- convert Julius grammar to SAPI XML grammar format +.SH "SYNOPSIS" +.HP 16 +\fBgram2sapixml.pl\fR [\fIprefix\fR...]
+.SH "DESCRIPTION" +.PP + +\fBgram2sapixml.pl\fR +converts a recognition grammar file of Julius (.grammar, .voca) to Microsoft SAPI XML grammar format. +\fIprefix\fR +should be a file name of target grammar, excluding suffixes. If multiple arguments are given, each will be processed sequentially in turn. +.PP +The internal character set should be in UTF\-8 format. By default +\fBgram2sapixml.pl\fR +assumes input in EUC\-JP encoding and tries to convert it to UTF\-8 using +\fBiconv\fR. You may want to disable this feature within the script. +.PP +It will fail to convert a left recursive rule in the grammar. When it fails, it will leave the source rules in the target .xml file, so you should modify the output manually to solve it. +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +.SH "DIAGNOSTICS" +.PP +The conversion procedure is a somewhat dumb one, only converting the non\-terminal symbols and terminal symbols (=word category name) into corresponding rules one by one. This is only a helper tool, and you will need manual inspection and editing to use it on a real SAPI application. +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius.
Index: julius4/man/jclient.pl.1 diff -u /dev/null julius4/man/jclient.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/jclient.pl.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,49 @@ +.\" Title: + jclient.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JCLIENT.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + jclient.pl + \- sample client for module mode (perl version) +.SH "SYNOPSIS" +.HP 11 +\fBjclient.pl\fR +.SH "DESCRIPTION" +.PP +This is yet another sample client written in perl. It will connect to Julius running in module mode, receive recognition results from Julius, and can send commands to control Julius. +.PP +This is a tiny program with only 57 lines. You can use it for free. +.SH "EXAMPLES" +.PP +Invoke Julius in module mode by specifying the "\fB\-module\fR" option: +.sp .RS 3n .nf % \fBjulius\fR \-C ... \-module .fi .RE +Then, at another terminal or on another host, invoke +\fBjclient.pl\fR +like below. The default hostname is "localhost", and port number is 10500. You can change them by editing the top part of the script. +.sp .RS 3n .nf % \fBjclient.pl\fR .fi .RE +It will then receive the outputs of Julius and output the raw message to standard out. Also, by inputting a raw module command to the standard input of +\fBjclient.pl\fR, it will be sent to Julius. See manuals for the specification of module mode. +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB jcontrol \fR( 1 ) +.SH "COPYRIGHT" +.PP +"\fBjclient.pl\fR" has been developed by Dr. Ryuichi Nisimura (nisimura @ sys.wakayama\-u.ac.jp). Use at your own risk. +.PP +If you have any feedback, comment or request, please contact the E\-mail address above, or look at the Web page below.
+.PP +http://w3voice.jp/ Index: julius4/man/jcontrol.1 diff -u /dev/null julius4/man/jcontrol.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/jcontrol.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,192 @@ +.\" Title: + jcontrol + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JCONTROL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + jcontrol + \- a sample module client written in C +.SH "SYNOPSIS" +.HP 9 +\fBjcontrol\fR {\fIhostname\fR} [\fIportnum\fR] +.SH "DESCRIPTION" +.PP + +\fBjcontrol\fR +is a simple console program to control Julius running on another host via the network API. It can send commands to Julius, and receive messages from Julius. +.PP +When invoked, jcontrol tries to connect to Julius running in "module mode" on the specified hostname. After the connection is established, jcontrol waits for user commands from standard input. +.PP +When the user types a command to jcontrol, it will be interpreted and the corresponding API command will be sent to Julius. When a message is received from Julius, its content will be output to standard output. +.PP +For the details about the API, see the related documents. +.SH "OPTIONS" +.PP +\fB hostname \fR +.RS 3n +Host name where Julius is running in module mode. +.RE +.PP +\fB portnum \fR +.RS 3n +port number (default: 10500) +.RE +.SH "COMMANDS" +.PP + +\fBjcontrol\fR +interprets commands from standard input. Below is a list of all commands. +.SS "Engine control" +.PP +pause +.RS 3n +Stop Julius and enter into paused status. In paused status, Julius will not run recognition even if speech input occurs. When this command is issued while recognition is running, Julius will stop after the recognition has been finished. +.RE +.PP +terminate +.RS 3n +Same as +pause, but discard the current speech input when the command is received in the middle of the recognition process.
+.RE +.PP +resume +.RS 3n +Restart Julius that has been paused or terminated. +.RE +.PP +inputparam \fIarg\fR +.RS 3n +Tell Julius how to deal with speech input in case grammar is changed just when recognition is running. Specify one: "TERMINATE", "PAUSE" or "WAIT". +.RE +.PP +version +.RS 3n +Tell Julius to send version description string. +.RE +.PP +status +.RS 3n +Tell Julius to send the system status (active +/ +sleep) +.RE +.SS "Grammar handling" +.PP +changegram \fIprefix\fR +.RS 3n +Send a new grammar "\fIprefix.dfa\fR" and "\fIprefix.dict\fR", and tell julius to use it as a new grammar. All the current grammars used in the current process of Julius will be deleted and replaced by the specified grammar. +.RE +.PP +addgram \fIprefix\fR +.RS 3n +Send a new grammar "\fIprefix.dfa\fR" and "\fIprefix.dict\fR" and add it to the current grammar. +.RE +.PP +deletegram \fIgramlist\fR +.RS 3n +Tell Julius to delete existing grammar. The grammar can be specified by either prefix name or number ID. The number ID can be determined from the message sent from Julius at each time grammar information has changed. To delete more than one grammar, specify all of them as a comma\-separated list. +.RE +.PP +deactivategram \fIgramlist\fR +.RS 3n +Tell Julius to de\-activate a specified grammar. The specified grammar will still be kept but will not be used for recognition. +.sp +The target grammar can be specified by either prefix name or number ID. The number ID can be determined from the message sent from Julius at each time grammar information has changed. To de\-activate more than one grammar, specify all of them as a comma\-separated list. +.RE +.PP +activategram \fIgramlist\fR +.RS 3n +Tell Julius to activate previously de\-activated grammar. The target grammar can be specified by either prefix name or number ID. The number ID can be determined from the message sent from Julius at each time grammar information has changed. 
To activate more than one grammar, specify all of them as a comma\-separated list. +.RE +.PP +addword \fIgrammar_name_or_id\fR \fIdictfile\fR +.RS 3n +Add the recognition word entries in the specified +\fIdictfile\fR +to the specified grammar on current process. +.RE +.PP +syncgram +.RS 3n +Force synchronize grammar status, like unix command "sync". +.RE +.SS "Process management" +.PP +Julius\-4 supports multi\-model recognition and multi decoding. In this case it is possible to control each recognition process, as defined by "\fB\-SR\fR" option, from module client. +.PP +In multi decoding mode, the module client holds "current process", and the process commands and grammar related commands will be issued toward the current process. +.PP +listprocess +.RS 3n +Tell Julius to send the list of existing recognition process. +.RE +.PP +currentprocess \fIprocname\fR +.RS 3n +Switch the current process to the process specified by the name. +.RE +.PP +shiftprocess +.RS 3n +Rotate the current process. At each call the current process will be changed to the next one. +.RE +.PP +addprocess \fIjconffile\fR +.RS 3n +Tell Julius to load a new recognition process into engine. The argument +\fIjconffile\fR +should be a jconf file that contains only one set of LM options and one SR definition. Note that the file should be visible on the running Julius, since +\fBjcontrol\fR +only sends the path name and Julius actually reads the jconf file. +.sp +The new LM and SR process will have the name of the jconffile. +.RE +.PP +delprocess \fIprocname\fR +.RS 3n +Delete the specified recognition process from the engine. +.RE +.PP +deactivateprocess \fIprocname\fR +.RS 3n +Tell Julius to temporarily stop the specified recognition process. The stopped process will not be executed for the input until activated again. +.RE +.PP +activateprocess \fIprocname\fR +.RS 3n +Tell Julius to activate the temporarily stopped process. 
+.RE +.SH "EXAMPLES" +.PP +The dump messages from Julius are output to tty with prefix ">" prepended to each line. Julius can be started in module mode like this: +.sp .RS 3n .nf % \fBjulius\fR \-C ... \-module .fi .RE +\fBjcontrol\fR can be launched with the host name: +.sp .RS 3n .nf % \fBjcontrol\fR hostname .fi .RE +It will then receive the outputs of Julius and output the raw message to standard out. Also, by inputting the commands above to the standard input of +\fBjcontrol\fR, it will be sent to Julius. See manuals for the specification of module mode. +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/julius.1 diff -u /dev/null julius4/man/julius.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/julius.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,1500 @@ +.\" Title: + julius + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JULIUS" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + julius + \- open source multi\-purpose LVCSR engine +.SH "SYNOPSIS" +.HP 7 +\fBjulius\fR [\-C\ \fIjconffile\fR] [\fIoptions\fR...] +.SH "DESCRIPTION" +.PP + +\fBjulius\fR +is a high\-performance, multi\-purpose, open\-source speech recognition engine for researchers and developers. It is capable of performing almost real\-time recognition of continuous speech with over 60k\-word 3\-gram language model and triphone HMM model, on most current PCs. 
+\fBjulius\fR +can perform recognition on audio files, live microphone input, network input and feature parameter files. +.PP +The core recognition module is implemented as C library called "JuliusLib". It can also be extended by plug\-in facility. +.SS "Supported Models" +.PP +\fBjulius\fR +needs a language model and an acoustic model to run as a speech recognizer. +\fBjulius\fR +supports the following models. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBAcoustic model\fR +.RS +.PP +Sub\-word HMM (Hidden Markov Model) in +HTK +ascii format are supported. Phoneme models (monophone), context dependent phoneme models (triphone), tied\-mixture and phonetic tied\-mixture models of any unit can be used. When using context dependent models, inter\-word context dependency is also handled. Multi\-stream feature and MSD\-HMM is also supported. You can further use a tool +\fBmkbinhmm\fR +to convert the ascii HMM file to a compact binary format for faster loading. +.PP +Note that +\fBjulius\fR +itself can only extract MFCC features from speech data. If you use acoustic HMM trained for other feature, you should give the input in +HTK +parameter file of the same feature type. +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBLanguage model: word N\-gram\fR +.RS +.PP +Word N\-gram language model, up to 10\-gram, is supported. Julius uses different N\-gram for each pass: left\-to\-right 2\-gram on 1st pass, and right\-to\-left N\-gram on 2nd pass. It is recommended to use both LR 2\-gram and RL N\-gram for Julius. However, you can use only single LR N\-gram or RL N\-gram. In such case, approximated LR 2\-gram computed from the given N\-gram will be applied at the first pass. +.PP +The Standard ARPA format is supported. In addition, a binary format is also supported for efficiency. The tool +\fBmkbingram\fR(1) +can convert ARPA format N\-gram to binary format. 
+.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBLanguage model: grammar\fR +.RS +.PP +The grammar format is an original one, and tools to create a recognition grammar are included in the distribution. A grammar consists of two files: one is a 'grammar' file that describes sentence structures in a BNF style, using word 'category' name as terminal symbols. Another is a 'voca' file that defines words with their pronunciations (i.e. phoneme sequences) for each category. They should be converted by +\fBmkdfa.pl\fR(1) +to a deterministic finite automaton file (.dfa) and a dictionary file (.dict), respectively. You can also use multiple grammars. +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBLanguage model: isolated word\fR +.RS +.PP +You can perform isolated word recognition using only word dictionary. With this model type, Julius will perform rapid one pass recognition with static context handling. Silence models will be added at both head and tail of each word. You can also use multiple dictionaries in a process. +.RE +.SS "Search Algorithm" +.PP +Recognition algorithm of +\fBjulius\fR +is based on a two\-pass strategy. Word 2\-gram and reverse word 3\-gram is used on the respective passes. The entire input is processed on the first pass, and then the final searching process is performed again for the input, using the result of the first pass to narrow the search space. Specifically, the recognition algorithm is based on a tree\-trellis heuristic search combined with left\-to\-right frame\-synchronous beam search and right\-to\-left stack decoding search. +.PP +When using context dependent phones (triphones), interword contexts are taken into consideration. For tied\-mixture and phonetic tied\-mixture models, high\-speed acoustic likelihood calculation is possible using gaussian pruning. +.PP +For more details, see the related documents. 
+.SH "OPTIONS" +.PP +These options specify the models, system behaviors and various search parameters to Julius. These options can be set at the command line, but it is recommended that you write them in a text file as a "jconf file", and specify it by "\-C" option. +.PP +Applications incorporating JuliusLib also use these options to set the parameters of core recognition engine. For example, a jconf file can be loaded to the engine by calling +\fBj_config_load_file_new()\fR +with the jconf file name as argument. +.PP +Please note that relative paths in a jconf file should be relative to the jconf file itself, not the current working directory. +.PP +Below are the details of all options, gathered by group. +.SS "Julius application option" +.PP +These are application options of Julius, outside of JuliusLib. It contains parameters and switches for result output, character set conversion, log level, and module mode options. These options are specific to Julius, and cannot be used at applications using JuliusLib other than Julius. +.PP +\fB \-outfile \fR +.RS 3n +On file input, this option writes the recognition result of each file to a separate file. The output file of an input file will have the same name but the suffix will be changed to ".out". (rev.4.0) +.RE +.PP +\fB \-separatescore \fR +.RS 3n +Output the language and acoustic scores separately. +.RE +.PP +\fB \-callbackdebug \fR +.RS 3n +Print the callback names at each call for debug. (rev.4.0) +.RE +.PP +\fB \-charconv \fR \fIfrom\fR \fIto\fR +.RS 3n +Print with character set conversion. +\fIfrom\fR +is the source character set used in the language model, and +\fIto\fR +is the target character set you want to get. +.sp +On Linux, the arguments should be a code name. You can obtain the list of available code names by invoking the command "iconv \-\-list". On Windows, the arguments should be a code name or codepage number. Code name should be one of "ansi", "mac", "oem", "utf\-7", "utf\-8", "sjis", "euc". 
Or you can specify any codepage number supported at your environment. +.RE +.PP +\fB \-nocharconv \fR +.RS 3n +Disable character conversion. +.RE +.PP +\fB \-module \fR [port] +.RS 3n +Run Julius on "Server Module Mode". After startup, Julius waits for tcp/ip connection from client. Once connection is established, Julius start communication with the client to process incoming commands from the client, or to output recognition results, input trigger information and other system status to the client. The default port number is 10500. +.RE +.PP +\fB \-record \fR \fIdir\fR +.RS 3n +Auto\-save all input speech data into the specified directory. Each segmented inputs are recorded each by one. The file name of the recorded data is generated from system time when the input ends, in a style of +YYYY.MMDD.HHMMSS.wav. File format is 16bit monoral +WAV. Invalid for mfcfile input. +.sp +With input rejection by +\fB\-rejectshort\fR, the rejected input will also be recorded even if they are rejected. +.RE +.PP +\fB \-logfile \fR \fIfile\fR +.RS 3n +Save all log output to a file instead of standard output. (Rev.4.0) +.RE +.PP +\fB \-nolog \fR +.RS 3n +Disable all log output. (Rev.4.0) +.RE +.PP +\fB \-help \fR +.RS 3n +Output help message and exit. +.RE +.SS "Global options" +.PP +These are model\-/search\-dependent options relating audio input, sound detection, GMM, decoding algorithm, plugin facility, and others. Global options should be placed before any instance declaration (\fB\-AM\fR, +\fB\-LM\fR, or +\fB\-SR\fR), or just after "\fB\-GLOBAL\fR" option. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBAudio input\fR +.RS +.PP +\fB \-input \fR {mic|rawfile|mfcfile|adinnet|stdin|netaudio|alsa|oss|esd} +.RS 3n +Choose speech input source. Specify 'file' or 'rawfile' for waveform file, 'htkparam' or 'mfcfile' for +HTK +parameter file. 
On file input, users will be prompted to enter the file name from stdin, or you can use +\fB\-filelist\fR +option to specify list of files to process. +.sp +\'mic' is to get audio input from a default live microphone device, and 'adinnet' means receiving waveform data via tcpip network from an adinnet client. 'netaudio' is from DatLink/NetAudio input, and 'stdin' means data input from standard input. +.sp +For waveform file input, only +WAV +(no compression) and +RAW +(noheader, 16bit, big endian) are supported by default. Other format can be read when compiled with +libsnd +library. To see what format is actually supported, see the help message using option +\fB\-help\fR. For stdin input, only WAV and RAW is supported. (default: mfcfile) +.sp +At Linux, you can choose API at run time by specifying +alsa, +oss +and +esd. +.RE +.PP +\fB \-filelist \fR \fIfilename\fR +.RS 3n +(With +\fB\-input rawfile|mfcfile\fR) perform recognition on all files listed in the file. The file should contain input file per line. Engine will end when all of the files are processed. +.RE +.PP +\fB \-notypecheck \fR +.RS 3n +By default, Julius checks the input parameter type whether it matches the AM or not. This option will disable the check and force engine to use the input vector as is. +.RE +.PP +\fB \-48 \fR +.RS 3n +Record input with 48kHz sampling, and down\-sample it to 16kHz on\-the\-fly. This option is valid for 16kHz model only. The down\-sampling routine was ported from +sptk. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +Host name for DatLink server input (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n +With +\fB\-input adinnet\fR, specify adinnet port number to listen. (default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +Julius by default removes successive zero samples in input speech data. This option inhibits the removal. 
+.RE +.PP +\fB \-zmean \fR, \fB \-nozmean \fR +.RS 3n +This option enables/disables DC offset removal of input waveform. Offset will be estimated from the whole input. For microphone / network input, zero mean of the first 48000 samples (3 seconds in 16kHz sampling) will be used for the estimation. (default: disabled) +.sp +This option uses static offset for the channel. See also +\fB\-zmeansource\fR +for frame\-wise offset removal. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBSpeech detection by level and zero\-cross\fR +.RS +.PP +\fB \-cutsilence \fR, \fB \-nocutsilence \fR +.RS 3n +Turn on / off the speech detection by level and zero\-cross. Default is on for mic / adinnet input, and off for files. +.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +Level threshold for speech input detection. Values should be in range from 0 to 32767. (default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +Zero crossing threshold per second. Only input that goes over the level threshold (\fB\-lv\fR) will be counted. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +Silence margin at the start of speech segment in milliseconds. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +Silence margin at the end of speech segment in milliseconds. (default: 400) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBInput rejection\fR +.RS +.PP +Two simple front\-end input rejection methods are implemented, based on input length and average power of detected segment. The rejection by average power is experimental, and can be enabled by +\-\-enable\-power\-reject +on compilation. Valid for MFCC feature with power coefficient and real\-time input only. +.PP +For GMM\-based input rejection see the GMM section below. +.PP +\fB \-rejectshort \fR \fImsec\fR +.RS 3n +Reject input shorter than specified milliseconds. Search will be terminated and no result will be output. 
+.RE +.PP +\fB \-powerthres \fR \fIthres\fR +.RS 3n +Reject the inputted segment by its average energy. If the average energy of the last recognized input is below the threshold, Julius will reject the input. (Rev.4.0) +.sp +This option is valid when +\-\-enable\-power\-reject +is specified at compilation time. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBGaussian mixture model / GMM\-VAD\fR +.RS +.PP +GMM will be used for input rejection by accumulated score, or for front\-end GMM\-based VAD when +\-\-enable\-gmm\-vad +is specified. +.PP +NOTE: You should also set the proper MFCC parameters required for the GMM, specifying the acoustic parameters described in AM section +\fB\-AM_GMM\fR. +.PP +When GMM\-based VAD is enabled, the voice activity score will be calculated at each frame as front\-end processing. The value will be computed as \\[ \\max_{m \\in M_v} p(x|m) \- \\max_{m \\in M_n} p(x|m) \\] where $M_v$ is a set of voice GMM, and $M_n$ is a set of noise GMM whose names should be specified by +\fB\-gmmreject\fR. The activity score will be then averaged for the last N frames, where N is specified by +\fB\-gmmmargin\fR. Julius updates the averaged activity score at each frame, and detects a speech up\-trigger when the value gets higher than a value specified by +\fB\-gmmup\fR, and detects a down\-trigger when it gets lower than a value of +\fB\-gmmdown\fR. +.PP +\fB \-gmm \fR \fIhmmdefs_file\fR +.RS 3n +GMM definition file in +HTK +format. If specified, GMM\-based input verification will be performed concurrently with the 1st pass, and you can reject the input according to the result as specified by +\fB\-gmmreject\fR. The GMM should be defined as one\-state HMMs. +.RE +.PP +\fB \-gmmnum \fR \fInumber\fR +.RS 3n +Number of Gaussian components to be computed per frame on GMM calculation. Only the N\-best Gaussians will be computed for rapid calculation. 
The default is 10 and specifying smaller value will speed up GMM calculation, but too small value (1 or 2) may cause degradation of identification performance. +.RE +.PP +\fB \-gmmreject \fR \fIstring\fR +.RS 3n +Comma\-separated list of GMM names to be rejected as invalid input. During recognition, the log likelihoods of GMMs accumulated for the entire input will be computed concurrently with the 1st pass. If the GMM name of the maximum score is within this string, the 2nd pass will not be executed and the input will be rejected. +.RE +.PP +\fB \-gmmmargin \fR \fIframes\fR +.RS 3n +(GMM_VAD) Head margin in frames. When a speech trigger is detected by GMM, recognition will start from current frame minus this value. (Rev.4.0) +.sp +This option will be valid only if compiled with +\-\-enable\-gmm\-vad. +.RE +.PP +\fB \-gmmup \fR \fIvalue\fR +.RS 3n +(GMM_VAD) Up trigger threshold of voice activity score. (Rev.4.1) +.sp +This option will be valid only if compiled with +\-\-enable\-gmm\-vad. +.RE +.PP +\fB \-gmmdown \fR \fIvalue\fR +.RS 3n +(GMM_VAD) Down trigger threshold of voice activity score. (Rev.4.1) +.sp +This option will be valid only if compiled with +\-\-enable\-gmm\-vad. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBDecoding option\fR +.RS +.PP +Real\-time processing means concurrent processing of MFCC computation and 1st pass decoding. By default, real\-time processing on the 1st pass is on for microphone / adinnet / netaudio input, and off for others. +.PP +\fB \-realtime \fR, \fB \-norealtime \fR +.RS 3n +Explicitly switch on / off real\-time (pipe\-line) processing on the first pass. The default is off for file input, and on for microphone, adinnet and NetAudio input. This option relates to the way CMN and energy normalization is performed: if off, they will be done using average features of whole input. If on, MAP\-CMN and energy normalization will be used to do real\-time processing. 
+.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBMisc. options\fR +.RS +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +Load a jconf file here. The content of the jconffile will be expanded at this point. +.RE +.PP +\fB \-version \fR +.RS 3n +Print version information to standard error, and exit. +.RE +.PP +\fB \-setting \fR +.RS 3n +Print engine setting information to standard error, and exit. +.RE +.PP +\fB \-quiet \fR +.RS 3n +Output less log. For result, only the best word sequence will be printed. +.RE +.PP +\fB \-debug \fR +.RS 3n +(For debug) output enormous internal message and debug information to log. +.RE +.PP +\fB \-check \fR {wchmm|trellis|triphone} +.RS 3n +For debug, enter interactive check mode. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +Specify directory to load plugin. If several directories exist, specify them by colon\-separated list. +.RE +.RE +.SS "Instance declaration for multi decoding" +.PP +The following arguments will create a new configuration set with default parameters, and switch current set to it. Jconf parameters specified after the option will be set into the current set. +.PP +To do multi\-model decoding, these arguments should be specified at the first of each model / search instances with different names. Any options before the first instance definition will be IGNORED. +.PP +When no instance definition is found (as older version of Julius), all the options are assigned to a default instance named +_default. +.PP +Please note that decoding with a single LM and multiple AMs is not fully supported. For example, you may want to construct the jconf file as following. +.sp .RS 3n .nf \-AM am_1 \-AM am_2 \-LM lm (LM spec..) \-SR search1 am_1 lm \-SR search2 am_2 lm .fi .RE +This type of model sharing is not supported yet, since some part of LM processing depends on the assigned AM. 
Instead, you can get the same result by defining the same LMs for each AM, like this: +.sp .RS 3n .nf \-AM am_1 \-AM am_2 \-LM lm_1 (LM spec..) \-LM lm_2 (same LM spec..) \-SR search1 am_1 lm_1 \-SR search2 am_2 lm_2 .fi .RE +.PP +\fB \-AM \fR \fIname\fR +.RS 3n +Create a new AM configuration set, and switch current to the new one. You should give a unique name. (Rev.4.0) +.RE +.PP +\fB \-LM \fR \fIname\fR +.RS 3n +Create a new LM configuration set, and switch current to the new one. You should give a unique name. (Rev.4.0) +.RE +.PP +\fB \-SR \fR \fIname\fR \fIam_name\fR \fIlm_name\fR +.RS 3n +Create a new search configuration set, and switch current to the new one. The specified AM and LM will be assigned to it. The +\fIam_name\fR +and +\fIlm_name\fR +can be either name or ID number. You should give a unique name. (Rev.4.0) +.RE +.PP +\fB \-AM_GMM \fR +.RS 3n +When using GMM for front\-end processing, you can specify GMM\-specific acoustic parameters after this option. If you do not specify +\fB\-AM_GMM\fR +with GMM, the GMM will share the same parameter vector as the last AM. The current AM will be switched to the GMM one, so be careful not to confuse with normal AM configurations. (Rev.4.0) +.RE +.PP +\fB \-GLOBAL \fR +.RS 3n +Start a global section. The global options should be placed before any instance declaration, or after this option on multiple model recognition. This can be used multiple times. (Rev.4.1) +.RE +.PP +\fB \-nosectioncheck \fR, \fB \-sectioncheck \fR +.RS 3n +Disable / enable option location check in multi\-model decoding. When enabled, the options between instance declarations are treated as "sections" and only the belonging option types can be written. For example, when an option +\fB\-AM\fR +is specified, only the AM related option can be placed after the option until other declaration is found. Also, global options should be placed at top, before any instance declaration. This is enabled by default. 
(Rev.4.1) +.RE +.SS "Language model (\fB\-LM\fR)" +.PP +This group contains options for model definition of each language model type. When using multiple LM, one instance can have only one LM. +.PP +Only one type of LM can be specified for a LM configuration. If you want to use multi model, you should define them one as a new LM. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBN\-gram\fR +.RS +.PP +\fB \-d \fR \fIbingram_file\fR +.RS 3n +Use binary format N\-gram. An ARPA N\-gram file can be converted to Julius binary format by +mkbingram. +.RE +.PP +\fB \-nlr \fR \fIarpa_ngram_file\fR +.RS 3n +A forward, left\-to\-right N\-gram language model in standard ARPA format. When both a forward N\-gram and backward N\-gram are specified, Julius uses this forward 2\-gram for the 1st pass, and the backward N\-gram for the 2nd pass. +.sp +Since ARPA file often gets huge and requires a lot of time to load, it may be better to convert the ARPA file to Julius binary format by +mkbingram. Note that if both forward and backward N\-gram is used for recognition, they together will be converted to a single binary. +.sp +When only a forward N\-gram is specified by this option and no backward N\-gram specified by +\fB\-nrl\fR, Julius performs recognition with only the forward N\-gram. The 1st pass will use the 2\-gram entry in the given N\-gram, and The 2nd pass will use the given N\-gram, with converting forward probabilities to backward probabilities by Bayes rule. (Rev.4.0) +.RE +.PP +\fB \-nrl \fR \fIarpa_ngram_file\fR +.RS 3n +A backward, right\-to\-left N\-gram language model in standard ARPA format. When both a forward N\-gram and backward N\-gram are specified, Julius uses the forward 2\-gram for the 1st pass, and this backward N\-gram for the 2nd pass. +.sp +Since ARPA file often gets huge and requires a lot of time to load, it may be better to convert the ARPA file to Julius binary format by +mkbingram. 
Note that if both forward and backward N\-gram is used for recognition, they together will be converted to a single binary. +.sp +When only a backward N\-gram is specified by this option and no forward N\-gram specified by +\fB\-nlr\fR, Julius performs recognition with only the backward N\-gram. The 1st pass will use the forward 2\-gram probability computed from the backward 2\-gram using Bayes rule. The 2nd pass fully use the given backward N\-gram. (Rev.4.0) +.RE +.PP +\fB \-v \fR \fIdict_file\fR +.RS 3n +Word dictionary file. +.RE +.PP +\fB \-silhead \fR \fIword_string\fR \fB \-siltail \fR \fIword_string\fR +.RS 3n +Silence word defined in the dictionary, for silences at the beginning of sentence and end of sentence. (default: "", "") +.RE +.PP +\fB \-iwspword \fR +.RS 3n +Add a word entry to the dictionary that should correspond to inter\-word pauses. This may improve recognition accuracy in some language model that has no explicit inter\-word pause modeling. The word entry to be added can be changed by +\fB\-iwspentry\fR. +.RE +.PP +\fB \-iwspentry \fR \fIword_entry_string\fR +.RS 3n +Specify the word entry that will be added by +\fB\-iwspword\fR. (default: " [sp] sp sp") +.RE +.PP +\fB \-sepnum \fR \fInumber\fR +.RS 3n +Number of high frequency words to be isolated from the lexicon tree, to ease approximation error that may be caused by the one\-best approximation on 1st pass. (default: 150) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBGrammar\fR +.RS +.PP +Multiple grammars can be specified by repeating +\fB\-gram\fR +and +\fB\-gramlist\fR. Note that this is unusual behavior from other options (in normal Julius option, last one will override previous ones). You can use +\fB\-nogram\fR +to reset the grammars already specified before the point. +.PP +\fB \-gram \fR gramprefix1[,gramprefix2[,gramprefix3,...]] +.RS 3n +Comma\-separated list of grammars to be used. the argument should be a prefix of a grammar, i.e. 
if you have +\fIfoo.dfa\fR +and +\fIfoo.dict\fR, you should specify them with a single argument +foo. Multiple grammars can be specified at a time as a comma\-separated list. +.RE +.PP +\fB \-gramlist \fR \fIlist_file\fR +.RS 3n +Specify a grammar list file that contains list of grammars to be used. The list file should contain the prefixes of grammars, each per line. A relative path in the list file will be treated as relative to the file, not the current path or configuration file. +.RE +.PP +\fB \-dfa \fR \fIdfa_file\fR \fB \-v \fR \fIdict_file\fR +.RS 3n +An old way of specifying grammar files separately. This is bogus, and should not be used any more. +.RE +.PP +\fB \-nogram \fR +.RS 3n +Remove the current list of grammars already specified by +\fB\-gram\fR, +\fB\-gramlist\fR, +\fB\-dfa\fR +and +\fB\-v\fR. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBIsolated word\fR +.RS +.PP +Dictionary can be specified by using +\fB\-w\fR +and +\fB\-wlist\fR. When you specify multiple times, all of them will be read at startup. You can use +\fB\-nogram\fR +to reset the already specified dictionaries at that point. +.PP +\fB \-w \fR \fIdict_file\fR +.RS 3n +Word dictionary for isolated word recognition. File format is the same as other LM. (Rev.4.0) +.RE +.PP +\fB \-wlist \fR \fIlist_file\fR +.RS 3n +Specify a dictionary list file that contains list of dictionaries to be used. The list file should contain the file name of dictionaries, each per line. A relative path in the list file will be treated as relative to the list file, not the current path or configuration file. (Rev.4.0) +.RE +.PP +\fB \-nogram \fR +.RS 3n +Remove the current list of dictionaries already specified by +\fB\-w\fR +and +\fB\-wlist\fR. +.RE +.PP +\fB \-wsil \fR \fIhead_sil_model_name\fR \fItail_sil_model_name\fR \fIsil_context_name\fR +.RS 3n +On isolated word recognition, silence models will be appended to the head and tail of each word at recognition. 
This option specifies the silence models to be appended. +\fIsil_context_name\fR +is the name of the head sil model and tail sil model as a context of word head phone and tail phone. For example, if you specify +\-wsil silB silE sp, a word with phone sequence +b eh t +will be translated as +silB sp\-b+eh b\-eh+t eh\-t+sp silE. (Rev.4.0) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBUser\-defined LM\fR +.RS +.PP +\fB \-userlm \fR +.RS 3n +Declare to use user LM functions in the program. This option should be specified if you use user\-defined LM functions. (Rev.4.0) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBMisc. LM options\fR +.RS +.PP +\fB \-forcedict \fR +.RS 3n +Skip error words in dictionary and force running. +.RE +.RE +.SS "Acoustic model and feature analysis (\fB\-AM\fR) (\fB\-AM_GMM\fR)" +.PP +This section is about options for acoustic model, feature extraction, feature normalizations and spectral subtraction. +.PP +After +\-AM name, an acoustic model and related specification should be written. You can use multiple AMs trained with different MFCC types. For GMM, the required parameter condition should be specified just as same as AMs after +\fB\-AM_GMM\fR. +.PP +When using multiple AMs, the values of +\fB\-smpPeriod\fR, +\fB\-smpFreq\fR, +\fB\-fsize\fR +and +\fB\-fshift\fR +should be the same among all AMs. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBAcoustic HMM\fR +.RS +.PP +\fB \-h \fR \fIhmmdef_file\fR +.RS 3n +Acoustic HMM definition file. It should be in +HTK +ascii format, or Julius binary format. You can convert +HTK +ascii format to Julius binary format using +mkbinhmm. +.RE +.PP +\fB \-hlist \fR \fIhmmlist_file\fR +.RS 3n +HMMList file for phone mapping. This file provides mapping between logical triphone names generated in the dictionary and the defined HMM names in hmmdefs. This option should be specified for context\-dependent model. 
+.RE +.PP +\fB \-tmix \fR \fInumber\fR +.RS 3n +Specify the number of top Gaussians to be calculated in a mixture codebook. Small number will speed up the acoustic computation, but AM accuracy may get worse with too small value. See also +\fB\-gprune\fR. (default: 2) +.RE +.PP +\fB \-spmodel \fR \fIname\fR +.RS 3n +Specify HMM model name that corresponds to short\-pause in an utterance. The short\-pause model name will be used in recognition: short\-pause skipping on grammar recognition, word\-end short\-pause model insertion with +\fB\-iwsp\fR +on N\-gram, or short\-pause segmentation (\fB\-spsegment\fR). (default: "sp") +.RE +.PP +\fB \-multipath \fR +.RS 3n +Enable multi\-path mode. To make decoding faster, Julius by default imposes a limit on HMM transitions that each model should have only one transition from initial state and to end state. On multi\-path mode, Julius does extra handling on inter\-model transition to allow model\-skipping transition and multiple output/input transitions. Note that specifying this option will make Julius a bit slower, and the larger beam width may be required. +.sp +This function was a compilation\-time option on Julius 3.x, and now becomes a run\-time option. By default (without this option), Julius checks the transition type of specified HMMs, and enables the multi\-path mode if required. You can force multi\-path mode with this option. (rev.4.0) +.RE +.PP +\fB \-gprune \fR {safe|heuristic|beam|none|default} +.RS 3n +Set Gaussian pruning algorithm to use. For tied\-mixture model, Julius performs Gaussian pruning to reduce acoustic computation, by calculating only the top N Gaussians in each codebook at each frame. The default setting will be set according to the model type and engine setting. +default +will force accepting the default setting. Set this to +none +to disable pruning and perform full computation. +safe +guarantees the top N Gaussians to be computed.
+heuristic +and +beam +do more aggressive computational cost reduction, but may result in a small loss of accuracy. (default: +safe +(standard), +beam +(fast) for tied mixture model, +none +for non tied\-mixture model). +.RE +.PP +\fB \-iwcd1 \fR {max|avg|best number} +.RS 3n +Select method to approximate inter\-word triphone on the head and tail of a word in the first pass. +.sp + +max +will apply the maximum likelihood of the same context triphones. +avg +will apply the average likelihood of the same context triphones. +best number +will apply the average of top N\-best likelihoods of the same context triphone. +.sp +Default is +best 3 +for use with N\-gram, and +avg +for grammar and word. When this AM is shared by LMs of both types, the latter one will be chosen. +.RE +.PP +\fB \-iwsppenalty \fR \fIfloat\fR +.RS 3n +Insertion penalty for word\-end short pauses appended by +\fB\-iwsp\fR. +.RE +.PP +\fB \-gshmm \fR \fIhmmdef_file\fR +.RS 3n +If this option is specified, Julius performs Gaussian Mixture Selection for efficient decoding. The hmmdefs should be a monophone model generated from an ordinary monophone HMM model, using +mkgshmm. +.RE +.PP +\fB \-gsnum \fR \fInumber\fR +.RS 3n +On GMS, specify number of monophone states to compute corresponding triphones in detail. (default: 24) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBSpeech analysis\fR +.RS +.PP +Only MFCC feature extraction is supported in current Julius. Thus when recognizing a waveform input from file or microphone, AM must be trained by MFCC. The parameter condition should also be set as exactly the same as the training condition by the options below. +.PP +When you give an input in +HTK +Parameter file, you can use any parameter type for AM. In this case Julius does not care about the type of input feature and AM, just read them as vector sequence and match them to the given AM. Julius only checks whether the parameter types are the same.
If it does not work well, you can disable this checking by +\fB\-notypecheck\fR. +.PP +In Julius, the parameter kind and qualifiers (as +TARGETKIND +in +HTK) and the number of cepstral parameters (NUMCEPS) will be set automatically from the content of the AM header, so you need not specify them by options. +.PP +Other parameters should be set exactly the same as training condition. You can also give a +HTK +Config file which you used to train AM to Julius by +\fB\-htkconf\fR. When this option is applied, Julius will parse the Config file and set appropriate parameter. +.PP +You can further embed those analysis parameter settings to a binary HMM file using +mkbinhmm. +.PP +If options specified in several ways, they will be evaluated in the order below. The AM embedded parameter will be loaded first if any. Then, the +HTK +config file given by +\fB\-htkconf\fR +will be parsed. If a value already set by AM embedded value, +HTK +config will override them. At last, the direct options will be loaded, which will override settings loaded before. Note that, when the same options are specified several times, later will override previous, except that +\fB\-htkconf\fR +will be evaluated first as described above. +.PP +\fB \-smpPeriod \fR \fIperiod\fR +.RS 3n +Sampling period of input speech, in unit of 100 nanoseconds. Sampling rate can also be specified by +\fB\-smpFreq\fR. Please note that the input frequency should be set equal to the training conditions of AM. (default: 625, corresponds to 16,000Hz) +.sp +This option corresponds to the +HTK +Option +SOURCERATE. The same value can be given to this option. +.sp +When using multiple AM, this value should be the same among all AMs. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +Set sampling frequency of input speech in Hz. Sampling rate can also be specified using +\fB\-smpPeriod\fR. Please note that this frequency should be set equal to the training conditions of AM. 
(default: 16,000) +.sp +When using multiple AM, this value should be the same among all AMs. +.RE +.PP +\fB \-fsize \fR \fIsample_num\fR +.RS 3n +Window size in number of samples. (default: 400) +.sp +This option corresponds to the +HTK +Option +WINDOWSIZE, but value should be in samples (HTK +value / smpPeriod). +.sp +When using multiple AM, this value should be the same among all AMs. +.RE +.PP +\fB \-fshift \fR \fIsample_num\fR +.RS 3n +Frame shift in number of samples. (default: 160) +.sp +This option corresponds to the +HTK +Option +TARGETRATE, but value should be in samples (HTK +value / smpPeriod). +.sp +When using multiple AM, this value should be the same among all AMs. +.RE +.PP +\fB \-preemph \fR \fIfloat\fR +.RS 3n +Pre\-emphasis coefficient. (default: 0.97) +.sp +This option corresponds to the +HTK +Option +PREEMCOEF. The same value can be given to this option. +.RE +.PP +\fB \-fbank \fR \fInum\fR +.RS 3n +Number of filterbank channels. (default: 24) +.sp +This option corresponds to the +HTK +Option +NUMCHANS. The same value can be given to this option. Be aware that the default value not the same as in +HTK +(22). +.RE +.PP +\fB \-ceplif \fR \fInum\fR +.RS 3n +Cepstral liftering coefficient. (default: 22) +.sp +This option corresponds to the +HTK +Option +CEPLIFTER. The same value can be given to this option. +.RE +.PP +\fB \-rawe \fR, \fB \-norawe \fR +.RS 3n +Enable/disable using raw energy before pre\-emphasis (default: disabled) +.sp +This option corresponds to the +HTK +Option +RAWENERGY. Be aware that the default value differs from +HTK +(enabled at +HTK, disabled at Julius). +.RE +.PP +\fB \-enormal \fR, \fB \-noenormal \fR +.RS 3n +Enable/disable normalizing log energy. On live input, this normalization will be approximated from the average of last input. (default: disabled) +.sp +This option corresponds to the +HTK +Option +ENORMALISE. Be aware that the default value differs from +HTK +(enabled at +HTK, disabled at Julius). 
+.RE +.PP +\fB \-escale \fR \fIfloat_scale\fR +.RS 3n +Scaling factor of log energy when normalizing log energy. (default: 1.0) +.sp +This option corresponds to the +HTK +Option +ESCALE. Be aware that the default value differs from +HTK +(0.1). +.RE +.PP +\fB \-silfloor \fR \fIfloat\fR +.RS 3n +Energy silence floor in dB when normalizing log energy. (default: 50.0) +.sp +This option corresponds to the +HTK +Option +SILFLOOR. +.RE +.PP +\fB \-delwin \fR \fIframe\fR +.RS 3n +Delta window size in number of frames. (default: 2) +.sp +This option corresponds to the +HTK +Option +DELTAWINDOW. The same value can be given to this option. +.RE +.PP +\fB \-accwin \fR \fIframe\fR +.RS 3n +Acceleration window size in number of frames. (default: 2) +.sp +This option corresponds to the +HTK +Option +ACCWINDOW. The same value can be given to this option. +.RE +.PP +\fB \-hifreq \fR \fIHz\fR +.RS 3n +Enable band\-limiting for MFCC filterbank computation: set upper frequency cut\-off. Value of \-1 will disable it. (default: \-1) +.sp +This option corresponds to the +HTK +Option +HIFREQ. The same value can be given to this option. +.RE +.PP +\fB \-lofreq \fR \fIHz\fR +.RS 3n +Enable band\-limiting for MFCC filterbank computation: set lower frequency cut\-off. Value of \-1 will disable it. (default: \-1) +.sp +This option corresponds to the +HTK +Option +LOFREQ. The same value can be given to this option. +.RE +.PP +\fB \-zmeanframe \fR, \fB \-nozmeanframe \fR +.RS 3n +With speech input, this option enables/disables frame\-wise DC offset removal. This corresponds to +HTK +configuration +ZMEANSOURCE. This cannot be used together with +\fB\-zmean\fR. (default: disabled) +.RE +.PP +\fB \-usepower \fR +.RS 3n +Use power instead of magnitude on filterbank analysis. (default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBNormalization\fR +.RS +.PP +Julius can perform cepstral mean normalization (CMN) for inputs. 
CMN will be activated when the given AM was trained with CMN (i.e. has "_Z" qualifier in the header). +.PP +The cepstral mean will be estimated in a different way according to the input type. On file input, the mean will be computed from the whole input. On live input such as microphone and network input, the cepstral mean of the input is unknown at the start. So MAP\-CMN will be used. On MAP\-CMN, an initial mean vector will be applied at the beginning, and the mean vector will be smeared to the mean of the incrementing input vector as input goes. Options below can control the behavior of MAP\-CMN. +.PP +\fB \-cvn \fR +.RS 3n +Enable cepstral variance normalization. At file input, the variance of whole input will be calculated and then applied. At live microphone input, variance of the last input will be applied. CVN is only supported for an audio input. +.RE +.PP +\fB \-vtln \fR \fIalpha\fR \fIlowcut\fR \fIhicut\fR +.RS 3n +Do frequency warping, typically for a vocal tract length normalization (VTLN). Arguments are warping factor, low frequency cut\-off and high frequency cut\-off. They correspond to +HTK +Config values, +WARPFREQ, +WARPLCUTOFF +and +WARPUCUTOFF. +.RE +.PP +\fB \-cmnload \fR \fIfile\fR +.RS 3n +Load initial cepstral mean vector from file on startup. The +\fIfile\fR +should be one saved by +\fB\-cmnsave\fR. Loading an initial cepstral mean enables Julius to better recognize the first utterance on a real\-time input. When used together with +\fB\-cmnnoupdate\fR, this initial value will be used for all input. +.RE +.PP +\fB \-cmnsave \fR \fIfile\fR +.RS 3n +Save the calculated cepstral mean vector into +\fIfile\fR. The parameters will be saved at each input end. If the output file already exists, it will be overwritten. +.RE +.PP +\fB \-cmnupdate \fR \fB \-cmnnoupdate \fR +.RS 3n +Control whether to update the cepstral mean at each input on real\-time input.
Disabling this and specifying +\fB\-cmnload\fR +will make engine to always use the loaded static initial cepstral mean. +.RE +.PP +\fB \-cmnmapweight \fR \fIfloat\fR +.RS 3n +Specify the weight of initial cepstral mean for MAP\-CMN. Specify larger value to retain the initial cepstral mean for a longer period, and smaller value to make the cepstral mean rely more on the current input. (default: 100.0) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBFront\-end processing\fR +.RS +.PP +Julius can perform spectral subtraction to reduce some stationary noise from audio input. Though it is not a powerful method, but it may work on some situation. Julius has two ways to estimate noise spectrum. One way is to assume that the first short segment of an speech input is noise segment, and estimate the noise spectrum as the average of the segment. Another way is to calculate average spectrum from noise\-only input using other tool +mkss, and load it in Julius. The former one is popular for speech file input, and latter should be used in live input. The options below will switch / control the behavior. +.PP +\fB \-sscalc \fR +.RS 3n +Perform spectral subtraction using head part of each file as silence part. The head part length should be specified by +\fB\-sscalclen\fR. Valid only for file input. Conflict with +\fB\-ssload\fR. +.RE +.PP +\fB \-sscalclen \fR \fImsec\fR +.RS 3n +With +\fB\-sscalc\fR, specify the length of head silence for noise spectrum estimation in milliseconds. (default: 300) +.RE +.PP +\fB \-ssload \fR \fIfile\fR +.RS 3n +Perform spectral subtraction for speech input using pre\-estimated noise spectrum loaded from +\fIfile\fR. The noise spectrum file can be made by +mkss. Valid for all speech input. Conflict with +\fB\-sscalc\fR. +.RE +.PP +\fB \-ssalpha \fR \fIfloat\fR +.RS 3n +Alpha coefficient of spectral subtraction for +\fB\-sscalc\fR +and +\fB\-ssload\fR. 
Noise will be subtracted stronger as this value gets larger, but distortion of the resulting signal also becomes remarkable. (default: 2.0) +.RE +.PP +\fB \-ssfloor \fR \fIfloat\fR +.RS 3n +Flooring coefficient of spectral subtraction. The spectral power that goes below zero after subtraction will be substituted by the source signal with this coefficient multiplied. (default: 0.5) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBMisc. AM options\fR +.RS +.PP +.PP +\fB \-htkconf \fR \fIfile\fR +.RS 3n +Parse the given +HTK +Config file, and set corresponding parameters to Julius. When using this option, the default parameter values are switched from Julius defaults to +HTK +defaults. +.RE +.RE +.SS "Recognition process and search (\fB\-SR\fR)" +.PP +This section contains options for search parameters on the 1st / 2nd pass such as beam width and LM weights, configurations for short\-pause segmentation, switches for word lattice output and confusion network output, forced alignments, and other options relating recognition process and result output. +.PP +Default values for beam width and LM weights will change according to compile\-time setup of JuliusLib , AM model type, and LM size. Please see the startup log for the actual values. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB1st pass parameters\fR +.RS +.PP +\fB \-lmp \fR \fIweight\fR \fIpenalty\fR +.RS 3n +(N\-gram) Language model weights and word insertion penalties for the first pass. +.RE +.PP +\fB \-penalty1 \fR \fIpenalty\fR +.RS 3n +(Grammar) word insertion penalty for the first pass. (default: 0.0) +.RE +.PP +\fB \-b \fR \fIwidth\fR +.RS 3n +Beam width in number of HMM nodes for rank beaming on the first pass. This value defines search width on the 1st pass, and has dominant effect on the total processing time. 
Smaller width will speed up the decoding, but too small value will result in a substantial increase of recognition errors due to search failure. Larger value will make the search stable and will lead to failure\-free search, but processing time will grow in proportion to the width. +.sp +The default value is dependent on acoustic model type: 400 (monophone), 800 (triphone), or 1000 (triphone, setup=v2.1) +.RE +.PP +\fB \-nlimit \fR \fInum\fR +.RS 3n +Upper limit of token per node. This option is valid when +\-\-enable\-wpair +and +\-\-enable\-wpair\-nlimit +are enabled at compilation time. +.RE +.PP +\fB \-progout \fR +.RS 3n +Enable progressive output of the partial results on the first pass. +.RE +.PP +\fB \-proginterval \fR \fImsec\fR +.RS 3n +Set the time interval for +\fB\-progout\fR +in milliseconds. (default: 300) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB2nd pass parameters\fR +.RS +.PP +\fB \-lmp2 \fR \fIweight\fR \fIpenalty\fR +.RS 3n +(N\-gram) Language model weights and word insertion penalties for the second pass. +.RE +.PP +\fB \-penalty2 \fR \fIpenalty\fR +.RS 3n +(Grammar) word insertion penalty for the second pass. (default: 0.0) +.RE +.PP +\fB \-b2 \fR \fIwidth\fR +.RS 3n +Envelope beam width (number of hypothesis) at the second pass. If the count of word expansion at a certain hypothesis length reaches this limit while search, shorter hypotheses are not expanded further. This prevents search to fall in breadth\-first\-like situation stacking on the same position, and improve search failure mostly for large vocabulary condition. (default: 30) +.RE +.PP +\fB \-sb \fR \fIfloat\fR +.RS 3n +Score envelope width for enveloped scoring. When calculating hypothesis score for each generated hypothesis, its trellis expansion and Viterbi operation will be pruned in the middle of the speech if score on a frame goes under the width. Giving small value makes the second pass faster, but computation error may occur. 
(default: 80.0) +.RE +.PP +\fB \-s \fR \fInum\fR +.RS 3n +Stack size, i.e. the maximum number of hypotheses that can be stored on the stack during the search. A larger value may give more stable results, but increases the amount of memory required. (default: 500) +.RE +.PP +\fB \-m \fR \fIcount\fR +.RS 3n +Number of expanded hypotheses required to discontinue the search. If the number of expanded hypotheses is greater than this threshold, the search is discontinued at that point. The larger this value is, the longer Julius searches before giving up. (default: 2000) +.RE +.PP +\fB \-n \fR \fInum\fR +.RS 3n +The number of candidates Julius tries to find. The search continues till this number of sentence hypotheses have been found. The obtained sentence hypotheses are sorted by score, and the final result is displayed in that order (see also +\fB\-output\fR). The possibility that the optimum hypothesis is correctly found increases as this value gets increased, but the processing time also becomes longer. The default value depends on the engine setup on compilation time: 10 (standard) or 1 (fast or v2.1) +.RE +.PP +\fB \-output \fR \fInum\fR +.RS 3n +The top N sentence hypotheses to be output at the end of search. Use with +\fB\-n\fR +(default: 1) +.RE +.PP +\fB \-lookuprange \fR \fIframe\fR +.RS 3n +Set the number of frames before and after to look up next word hypotheses in the word trellis on the second pass. This prevents the omission of short words, but with a large value, the number of expanded hypotheses increases and system becomes slow. (default: 5) +.RE +.PP +\fB \-looktrellis \fR +.RS 3n +(Grammar) Expand only the words survived on the first pass instead of expanding all the words predicted by grammar. This option makes second pass decoding faster especially for large vocabulary condition, but may increase deletion error of short words.
(default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBShort\-pause segmentation / decoder\-VAD\fR +.RS +.PP +When compiled with +\-\-enable\-decoder\-vad, the short\-pause segmentation will be extended to support decoder\-based VAD. +.PP +\fB \-spsegment \fR +.RS 3n +Enable short\-pause segmentation mode. Input will be segmented when a short pause word (word with only silence model in pronunciation) gets the highest likelihood at certain successive frames on the first pass. When detected segment end, Julius stop the 1st pass at the point, perform 2nd pass, and continue with next segment. The word context will be considered among segments. (Rev.4.0) +.sp +When compiled with +\-\-enable\-decoder\-vad, this option enables decoder\-based VAD, to skip long silence. +.RE +.PP +\fB \-spdur \fR \fIframe\fR +.RS 3n +Short pause duration length to detect end of input segment, in number of frames. (default: 10) +.RE +.PP +\fB \-pausemodels \fR \fIstring\fR +.RS 3n +A comma\-separated list of pause model names to be used at short\-pause segmentation. The word whose pronunciation consists of only the pause models will be treated as "pause word" and used for pause detection. If not specified, name of +\fB\-spmodel\fR, +\fB\-silhead\fR +and +\fB\-siltail\fR +will be used. (Rev.4.0) +.RE +.PP +\fB \-spmargin \fR \fIframe\fR +.RS 3n +Back step margin at trigger up for decoder\-based VAD. When speech up\-trigger found by decoder\-VAD, Julius will rewind the input parameter by this value, and start recognition at the point. (Rev.4.0) +.sp +This option will be valid only if compiled with +\-\-enable\-decoder\-vad. +.RE +.PP +\fB \-spdelay \fR \fIframe\fR +.RS 3n +Trigger decision delay frame at trigger up for decoder\-based VAD. (Rev.4.0) +.sp +This option will be valid only if compiled with +\-\-enable\-decoder\-vad. 
+.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBWord lattice / confusion network output\fR +.RS +.PP +\fB \-lattice \fR, \fB \-nolattice \fR +.RS 3n +Enable / disable generation of word graph. Search algorithm also has changed to optimize for better word graph generation, so the sentence result may not be the same as normal N\-best recognition. (Rev.4.0) +.RE +.PP +\fB \-confnet \fR, \fB \-noconfnet \fR +.RS 3n +Enable / disable generation of confusion network. Enabling this will also activates +\fB\-lattice\fR +internally. (Rev.4.0) +.RE +.PP +\fB \-graphrange \fR \fIframe\fR +.RS 3n +Merge same words at neighbor position at graph generation. If the beginning time and ending time of two word candidates of the same word is within the specified range, they will be merged. The default is 0 (allow merging same words on exactly the same location) and specifying larger value will result in smaller graph output. Setting this value to +\-1 +will disable merging, in that case same words on the same location of different scores will be left as they are. (default: 0) +.RE +.PP +\fB \-graphcut \fR \fIdepth\fR +.RS 3n +Cut the resulting graph by its word depth at post\-processing stage. The depth value is the number of words to be allowed at a frame. Setting to \-1 disables this feature. (default: 80) +.RE +.PP +\fB \-graphboundloop \fR \fIcount\fR +.RS 3n +Limit the number of boundary adjustment loop at post\-processing stage. This parameter prevents Julius from blocking by infinite adjustment loop by short word oscillation. (default: 20) +.RE +.PP +\fB \-graphsearchdelay \fR, \fB \-nographsearchdelay \fR +.RS 3n +When this option is enabled, Julius modifies its graph generation algorithm on the 2nd pass not to terminate search by graph merging, until the first sentence candidate is found. This option may improve graph accuracy, especially when you are going to generate a huge word graph by setting broad search. 
Namely, it may result in better graph accuracy when you set wide beams on both 1st pass +\fB\-b\fR +and 2nd pass +\fB\-b2\fR, and large number for +\fB\-n\fR. (default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBMulti\-gram / multi\-dic recognition\fR +.RS +.PP +\fB \-multigramout \fR, \fB \-nomultigramout \fR +.RS 3n +On grammar recognition using multiple grammars, Julius will output only the best result among all grammars. Enabling this option will make Julius to output result for each grammar. (default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBForced alignment\fR +.RS +.PP +\fB \-walign \fR +.RS 3n +Do viterbi alignment per word units for the recognition result. The word boundary frames and the average acoustic scores per frame will be calculated. +.RE +.PP +\fB \-palign \fR +.RS 3n +Do viterbi alignment per phone units for the recognition result. The phone boundary frames and the average acoustic scores per frame will be calculated. +.RE +.PP +\fB \-salign \fR +.RS 3n +Do viterbi alignment per state for the recognition result. The state boundary frames and the average acoustic scores per frame will be calculated. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBMisc. search options\fR +.RS +.PP +\fB \-inactive \fR +.RS 3n +Start this recognition process instance with inactive state. (Rev.4.0) +.RE +.PP +\fB \-1pass \fR +.RS 3n +Perform only the first pass. +.RE +.PP +\fB \-fallback1pass \fR +.RS 3n +When 2nd pass fails, Julius finish the recognition with no result. This option tell Julius to output the 1st pass result as a final result when the 2nd pass fails. Note that some score output (confidence etc.) may not be useful. This was the default behavior of Julius\-3.x. +.RE +.PP +\fB \-no_ccd \fR, \fB \-force_ccd \fR +.RS 3n +Explicitly switch phone context handling at search. 
Normally Julius determines whether the AM in use is a context\-dependent model or not from the model names, i.e., whether the names contain character ++ +and +\-. This option will override the automatic detection. +.RE +.PP +\fB \-cmalpha \fR \fIfloat\fR +.RS 3n +Smoothing parameter for confidence scoring. (default: 0.05) +.RE +.PP +\fB \-iwsp \fR +.RS 3n +(Multi\-path mode only) Enable inter\-word context\-free short pause insertion. This option appends a skippable short pause model for every word end. The short\-pause model can be specified by +\fB\-spmodel\fR. +.RE +.PP +\fB \-transp \fR \fIfloat\fR +.RS 3n +Additional insertion penalty for transparent words. (default: 0.0) +.RE +.PP +\fB \-demo \fR +.RS 3n +Equivalent to +\fB\-progout \-quiet\fR. +.RE +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(using mic input with alsa device) specify a capture device name. If not specified, "default" will be used. +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(using mic input with oss device) specify a capture device path. If not specified, "\fI/dev/dsp\fR" will be used. +.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Try to set input latency of microphone input in milliseconds. Smaller value will shorten latency but sometimes make process unstable. Default value will depend on the running OS. +.RE +.SH "EXAMPLES" +.PP +For examples of system usage, refer to the tutorial section in the Julius documents. +.SH "NOTICE" +.PP +Note about jconf files: relative paths in a jconf file are interpreted as relative to the jconf file itself, not to the current directory. +.SH "SEE ALSO" +.PP +\fBjulian\fR(1), +\fBjcontrol\fR(1), +\fBadinrec\fR(1), +\fBadintool\fR(1), +\fBmkbingram\fR(1), +\fBmkbinhmm\fR(1), +\fBmkgshmm\fR(1), \fBwav2mfcc\fR(1), +\fBmkss\fR(1) +.PP +\fIhttp://julius.sourceforge.jp/en/\fR +.SH "DIAGNOSTICS" +.PP +Julius normally will return the exit status 0.
If an error occurs, Julius exits abnormally with exit status 1. If an input file cannot be found or cannot be loaded for some reason then Julius will skip processing for that file. +.SH "BUGS" +.PP +There are some restrictions to the type and size of the models Julius can use. For a detailed explanation refer to the Julius documentation. For bug\-reports, inquiries and comments please contact julius\-info at lists.sourceforge.jp. +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 2000\-2008 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "AUTHORS" +.PP +Rev.1.0 (1998/02/20) +.RS 3n +Designed by Tatsuya KAWAHARA and Akinobu LEE (Kyoto University) +.sp +Development by Akinobu LEE (Kyoto University) +.RE +.PP +Rev.1.1 (1998/04/14), Rev.1.2 (1998/10/31), Rev.2.0 (1999/02/20), Rev.2.1 (1999/04/20), Rev.2.2 (1999/10/04), Rev.3.0 (2000/02/14), Rev.3.1 (2000/05/11) +.RS 3n +Development of above versions by Akinobu LEE (Kyoto University) +.RE +.PP +Rev.3.2 (2001/08/15), Rev.3.3 (2002/09/11), Rev.3.4 (2003/10/01), Rev.3.4.1 (2004/02/25), Rev.3.4.2 (2004/04/30) +.RS 3n +Development of above versions by Akinobu LEE (Nara Institute of Science and Technology) +.RE +.PP +Rev.3.5 (2005/11/11), Rev.3.5.1 (2006/03/31), Rev.3.5.2 (2006/07/31), Rev.3.5.3 (2006/12/29), Rev.4.0 (2007/12/19), Rev.4.1 (2008/10/03) +.RS 3n +Development of above versions by Akinobu LEE (Nagoya Institute of Technology) +.RE +.SH "THANKS TO" +.PP +From rev.3.2, Julius is released by the "Information Processing Society, Continuous Speech Consortium". +.PP +The Windows DLL version was developed and released by Hideki BANNO (Nagoya University). +.PP +The Windows Microsoft Speech API compatible version was developed by Takashi SUMIYOSHI (Kyoto University).
Index: julius4/man/mkbingram.1 diff -u /dev/null julius4/man/mkbingram.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkbingram.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,99 @@ +.\" Title: + mkbingram + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINGRAM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkbingram + \- make binary N\-gram from ARPA N\-gram file +.SH "SYNOPSIS" +.HP 10 +\fBmkbingram\fR [\-nlr\ \fIforward_ngram.arpa\fR] [\-nrl\ \fIbackward_ngram.arpa\fR] [\-d\ \fIold_bingram_file\fR] {output_bingram_file} +.SH "DESCRIPTION" +.PP + +\fBmkbingram\fR +is a tool to convert N\-gram definition file(s) in ARPA standard format to a compact Julius binary format. It will speed up the initial loading time of N\-gram much faster. It can read gzipped file directly. +.PP +From rev.4.0, Julius can deal with forward N\-gram, backward N\-gram and their combinations. So, +\fBmkbingram\fR +now generates binary N\-gram file from one of them, or combining them two to produce one binary N\-gram. +.PP +When only a forward N\-gram is specified, +\fBmkbingram\fR +generates binary N\-gram from only the forward N\-gram. When using this binary N\-gram at Julius, it performs the 1st pass with the 2\-gram probabilities in the N\-gram, and run the 2nd pass with the given N\-gram fully, with converting forward probabilities to backward probabilities by Bayes rule. +.PP +When only a backward N\-gram is specified, +\fBmkbingram\fR +generates an binary N\-gram file that contains only the backward N\-gram. The 1st pass will use forward 2\-gram probabilities that can be computed from the backward 2\-gram using Bayes rule, and the 2nd pass use the given backward N\-gram fully. 
+.PP +When both forward and backward N\-grams are specified, the 2\-gram part in the forward N\-gram and all backward N\-gram will be combined into single bingram file. The forward 2\-gram will be applied for the 1st pass and backward N\-gram for the 2nd pass. Note that both N\-gram should be trained in the same corpus with same parameters (i.e. cut\-off thresholds), with same vocabulary. +.PP +The old binary N\-gram produced by +\fBmkbingram\fR +of version 3.x and earlier can be used in Julius\-4, but you can convert the old version to the new version by specifying it as input of current +\fBmkbingram\fR +by option "\fB\-d\fR". +.PP +Please note that binary N\-gram file converted by +\fBmkbingram\fR +of version 4.0 and later cannot be read by older Julius 3.x. +.SH "OPTIONS" +.PP +\fB \-nlr \fR \fIforward_ngram.arpa\fR +.RS 3n +Read in a forward (left\-to\-right) word N\-gram file in ARPA standard format. +.RE +.PP +\fB \-nrl \fR \fIbackward_ngram.arpa\fR +.RS 3n +Read in a backward (right\-to\-left) word N\-gram file in ARPA standard format. +.RE +.PP +\fB \-d \fR \fIold_bingram_file\fR +.RS 3n +Read in a binary N\-gram file. +.RE +.PP +\fIoutput_bingram_file\fR +.RS 3n +binary N\-gram file name to output. 
+.RE +.SH "EXAMPLES" +.PP +Convert a set of forward and backward N\-gram in ARPA format into Julius binary form: +.sp .RS 3n .nf % \fBmkbingram\fR \-nlr 2gram.arpa \-nrl rev\-Ngram.arpa outfile .fi .RE +Convert a single forward 4\-gram in ARPA format into a binary file: +.sp .RS 3n .nf % \fBmkbingram\fR \-nlr 4gram.arpa outfile .fi .RE +Convert old binary N\-gram file to current format: +.sp .RS 3n .nf % \fBmkbingram\fR \-d old_bingram new_bingram .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbinhmm \fR( 1 ) +, +\fB mkbinhmmlist \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/mkbinhmm.1 diff -u /dev/null julius4/man/mkbinhmm.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkbinhmm.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,80 @@ +.\" Title: + mkbinhmm + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINHMM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkbinhmm + \- convert HMM definition file in HTK ascii format to Julius binary format +.SH "SYNOPSIS" +.HP 9 +\fBmkbinhmm\fR [\-htkconf\ \fIHTKConfigFile\fR] {hmmdefs_file} {binhmm_file} +.SH "DESCRIPTION" +.PP + +\fBmkbinhmm\fR +convert an HMM definition file in HTK ascii format into a binary HMM file for Julius. It will greatly speed up the launch process. +.PP +You can also embed acoustic analysis condition parameters needed for recognition into the output file. 
To embed the parameters, specify the HTK Config file you have used to extract acoustic features for training the HMM by the option "\fB\-htkconf\fR". +.PP +The embedded parameters in a binary HMM format will be loaded into Julius automatically, so you do not need to specify the acoustic feature options at run time. It will be convenient when you deliver an acoustic model. +.PP +You can also specify binary file as the input. This can be used to update the old binary format into new one, or to embed the config parameters into the already existing binary files. If the input binhmm already has acoustic analysis parameters embedded, they will be overridden by the specified values. +.PP + +\fBmkbinhmm\fR +can read gzipped file as input. +.SH "OPTIONS" +.PP +\fB \-htkconf \fR \fIHTKConfigFile\fR +.RS 3n +HTK Config file you used at training time. If specified, the values are embedded to the output file. +.RE +.PP +\fIhmmdefs_file\fR +.RS 3n +The source HMM definition file in HTK ascii format or Julius binary format. +.RE +.PP +\fIbinhmm_file\fR +.RS 3n +Output file. 
+.RE +.SH "EXAMPLES" +.PP +Convert HTK ascii format HMM definition file into Julius binary file: +.sp .RS 3n .nf % \fBmkbinhmm\fR hmmdefs.ascii binhmm .fi .RE +Furthermore, embed acoustic feature parameters as specified by Config file +.sp .RS 3n .nf % \fBmkbinhmm\fR \-htkconf Config hmmdefs.ascii binhmm .fi .RE +Embed the acoustic parameters into an existing binary file +.sp .RS 3n .nf % \fBmkbinhmm\fR \-htkconf Config old_binhmm new_binhmm .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbingram \fR( 1 ) +, +\fB mkbinhmmlist \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/mkbinhmmlist.1 diff -u /dev/null julius4/man/mkbinhmmlist.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkbinhmmlist.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,77 @@ +.\" Title: + mkbinhmmlist + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINHMMLIST" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkbinhmmlist + \- convert HMMList file into binary format +.SH "SYNOPSIS" +.HP 13 +\fBmkbinhmmlist\fR {hmmdefs_file} {HMMList_file} {output_binhmmlist_file} +.SH "DESCRIPTION" +.PP + +\fBmkbinhmmlist\fR +converts a HMMList file to binary format. Since the index trees for lookup are also stored in the binary format, it will speed up the startup of Julius, especially when using a big HMMList file. +.PP +For conversion, HMM definition file +\fIhmmdefs_file\fR +that will be used together at Julius needs to be specified. 
The format of the HMM definition file can be either ascii or Julius binary format. +.PP +The output binary file can be used in Julius in the same way as the original HMMList, with the option "\fB\-hlist\fR". The format will be auto\-detected by Julius. +.PP + +\fBmkbinhmmlist\fR +can read gzipped file. +.SH "OPTIONS" +.PP +\fIhmmdefs_file\fR +.RS 3n +Acoustic HMM definition file, in HMM ascii format or Julius binary format. +.RE +.PP +\fIHMMList_file\fR +.RS 3n +Source HMMList file +.RE +.PP +\fIoutput_binhmmlist_file\fR +.RS 3n +Output file, which will be overwritten if it already exists. +.RE +.SH "EXAMPLES" +.PP +Convert a HMMList file +\fIlogicalTri\fR +into binary format and store to +\fIlogicalTri.bin\fR: +.sp .RS 3n .nf % \fBmkbinhmmlist\fR binhmm logicalTri logicalTri.bin .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbinhmm \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. Index: julius4/man/mkdfa.pl.1 diff -u /dev/null julius4/man/mkdfa.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkdfa.pl.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,111 @@ +.\" Title: + mkdfa.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKDFA.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkdfa.pl + \- grammar compiler +.SH "SYNOPSIS" +.HP 9 +\fBmkdfa.pl\fR [\fIoptions\fR...] {prefix} +.SH "DESCRIPTION" +.PP + +\fBmkdfa.pl\fR +compiles the Julian format grammar (\fI.grammar\fR +and +\fI.voca\fR) to Julian native formats (\fI.dfa\fR +and +\fI.dict\fR). 
In addition, "\fI.term\fR" will be also generated that stores correspondence of category ID used in the output files to the source category name. +.PP + +prefix +should be the common file name prefix of "\fI.grammar\fR" and "\fI.voca\fR" files. From +prefix.grammar +and +prefix.voca +file, +prefix.dfa, +prefix.dict +and +prefix.term +will be output. +.SH "OPTIONS" +.PP +\fB \-n \fR +.RS 3n +Do not process the dictionary. With this option you can convert only the +\fI.grammar\fR +file to +\fI.dfa\fR +file without +\fI.voca\fR +file. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBTMP\fR\fR\fB or \fR\fB\fBTEMP\fR\fR\fB \fR +.RS 3n +Set directory to store temporary files. If not specified, one of the directories on the following list will be used: +\fI/tmp\fR, +\fI/var/tmp\fR, +\fI/WINDOWS/Temp\fR, +\fI/WINNT/Temp\fR. +.RE +.SH "EXAMPLES" +.PP +Convert a grammar +\fIfoo.grammar\fR +and +\fIfoo.voca\fR +to +\fIfoo.dfa\fR, +\fIfoo.dict\fR +and +\fIfoo.term\fR. +.sp .RS 3n .nf % \fBmkdfa.pl\fR foo .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB nextword \fR( 1 ) +, +\fB accept_check \fR( 1 ) +, +\fB dfa_minimize \fR( 1 ) +.SH "DIAGNOSTICS" +.PP + +\fBmkdfa.pl\fR +invokes +\fBmkfa\fR +and +\fBdfa_minimize\fR +internally. They should be placed at the same directory as +\fBmkdfa.pl\fR. +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. 
Index: julius4/man/mkgshmm.1 diff -u /dev/null julius4/man/mkgshmm.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkgshmm.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,52 @@ +.\" Title: + mkgshmm + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKGSHMM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkgshmm + \- convert monophone HMM to GS HMM for Julius +.SH "SYNOPSIS" +.HP 8 +\fBmkgshmm\fR {monophone_hmmdefs} + > + {outputfile} +.SH "DESCRIPTION" +.PP +mkgshmm converts monophone HMM definition file in HTK format into a special format for Gaussian Mixture Selection (GMS) in Julius. +.PP +GMS is an algorithm to reduce the amount of acoustic computation with triphone HMM, by pre\-selection of promising gaussian mixtures using likelihoods of corresponding monophone mixtures. +.SH "EXAMPLES" +.PP +(1) Prepare a monophone model which was trained by the same corpus as target triphone model. +.PP +(2) Convert the monophone model using mkgshmm. +.sp .RS 3n .nf % \fBmkgshmm\fR monophone > gshmmfile .fi .RE +(3) Specify the output file in Julius with option "\-gshmm" +.sp .RS 3n .nf % \fBjulius\fR \-C ... \-gshmm gshmmfile .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. 
Index: julius4/man/mkss.1 diff -u /dev/null julius4/man/mkss.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/mkss.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,65 @@ +.\" Title: + mkss + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKSS" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + mkss + \- calculate average spectrum for spectral subtraction +.SH "SYNOPSIS" +.HP 5 +\fBmkss\fR [\fIoptions\fR...] {filename} +.SH "DESCRIPTION" +.PP + +\fBmkss\fR +is a tool to estimate noise spectrum for spectral subtraction on Julius. It reads a few seconds of sound data from microphone input, calculates the average spectrum and saves it to a file. The output file can be used as noise spectrum data in Julius (option "\fB\-ssload\fR"). +.PP +The recording will start immediately after startup. Sampling format is 16bit, monaural. If the output file already exists, it will be overwritten. +.SH "OPTIONS" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +Sampling frequency in Hz (default: 16,000) +.RE +.PP +\fB \-len \fR \fImsec\fR +.RS 3n +capture length in milliseconds (default: 3000) +.RE +.PP +\fB \-fsize \fR \fIsample_num\fR +.RS 3n +frame size in number of samples (default: 400) +.RE +.PP +\fB \-fshift \fR \fIsample_num\fR +.RS 3n +frame shift in number of samples (default: 160) +.RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. 
Index: julius4/man/nextword.1 diff -u /dev/null julius4/man/nextword.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/nextword.1 Thu Oct 2 17:23:47 2008 @@ -0,0 +1,106 @@ +.\" Title: + nextword + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "NEXTWORD" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "NAME" + + nextword + \- display next predicted words (in reverse order) +.SH "SYNOPSIS" +.HP 9 +\fBnextword\fR [\-t] [\-r] [\-s\ \fIspname\fR] [\-v] {prefix} +.SH "DESCRIPTION" +.PP +Given a partial (part of) sentence from the end, it outputs the next words allowed in the specified grammar. +.PP + +\fI.dfa\fR, +\fI.dict\fR +and +\fI.term\fR +files are needed to execute. They can be generated from +\fI.grammar\fR +and +\fI.voca\fR +file by +\fBmkdfa.pl\fR. +.PP +Please note that the latter part of sentence should be given, since the main 2nd pass does a right\-to\-left parsing. +.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +Input / Output in category name. (default: word) +.RE +.PP +\fB \-r \fR +.RS 3n +Enter in reverse order +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +the name string of short\-pause word to be suppressed (default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +Debug output. 
+.RE +.SH "EXAMPLES" +.PP +Exmple output of a sample grammar "fruit": +.sp +.RS 3n +.nf +% \fBnextword\fR fruit +Stat: init_voca: read 36 words +Reading in term file (optional)...done +15 categories, 36 words +DFA has 26 nodes and 42 arcs +\-\-\-\-\- +command completion is disabled +\-\-\-\-\- +wseq > A BANANA +[wseq: A BANANA ] +[cate: (NUM_1|NUM_1|A|A) FRUIT_SINGULAR NS_E] +PREDICTED CATEGORIES/WORDS: + NS_B ( ) + HAVE (HAVE ) + WANT (WANT ) + NS_B ( ) + HAVE (HAVE ) + WANT (WANT ) +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB accept_check \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1997\-2000 Information\-technology Promotion Agency, Japan +.PP +Copyright (c) 1991\-2008 Kawahara Lab., Kyoto University +.PP +Copyright (c) 2000\-2005 Shikano Lab., Nara Institute of Science and Technology +.PP +Copyright (c) 2005\-2008 Julius project team, Nagoya Institute of Technology +.SH "LICENSE" +.PP +The same as Julius. From sumomo @ users.sourceforge.jp Thu Oct 2 17:23:48 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 02 Oct 2008 17:23:48 +0900 Subject: [Julius-cvs 313] CVS update: julius4/man/ja Message-ID: <1222935828.617355.32437.nullmailer@users.sourceforge.jp> Index: julius4/man/ja/accept_check.1 diff -u /dev/null julius4/man/ja/accept_check.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/accept_check.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,95 @@ +.\" Title: + accept_check + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ACCEPT_CHECK" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + accept_check + \- 文法における単語列の受理/非受理チェック +.SH "概要" +.HP 13 +\fBaccept_check\fR [\-t] [\-s\ \fIspname\fR] [\-v] {prefix} +.SH "DESCRIPTION" +.PP +accept_check は,文法で文の受理・非受理を判定するツールです.文は標準 入力から与えます.受理すべき文を一行ずつテキストファイルにまとめて書い 
ておき,それをaccept_check の標準入力に与えることで,その文法 (\fIprefix.dfa\fR +および +\fIprefix.dict\fR) において目的の文が受理されるかどうかをバッチ的にチェックできます. +.PP +実行には .dfa, .dict, .term の各ファイルが必要です. あらかじめ +\fBmkdfa.pl\fR +で生成しておいて下さい. +.PP +対象とする文は,文法の語彙単位(.vocaの第1フィールド)で空白で区切って与 えます.最初と最後には多くの場合 +silB, +silE +が必要であることに気をつけて下さい.また, ショートポーズ単語は文に含めないでください. +.PP +同一表記の単語が複数ある場合,accept_check はその可能な解釈の全ての組 み合わせについて調べ,どれか1つのパターンでも受理可能であれば受理,す べてのパターンで受理不可能であれば受理不可能とします. +.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +単語ではなくカテゴリ名で入力・出力する. +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +スキップすべきショートポーズ単語の名前を指定する. (default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +デバッグ出力. +.RE +.SH "EXAMPLES" +.PP +vfr (フィッティングタスク用文法) での実行例: +.sp +.RS 3n +.nf +% accept_check vfr +Reading in dictionary...done +Reading in DFA grammar...done +Mapping dict item <\-> DFA terminal (category)...done +Reading in term file (optional)...done +42 categories, 99 words +DFA has 135 nodes and 198 arcs +\-\-\-\-\- +please input word sequence>silB 白 に して 下さい silE +wseq: silB 白 に して 下さい silE +cate: NS_B COLOR_N (NI|NI_AT) SURU_V KUDASAI_V NS_E +accepted +please input word sequence> +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB nextword \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/adinrec.1 diff -u /dev/null julius4/man/ja/adinrec.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/adinrec.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,155 @@ +.\" Title: + adinrec + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ADINREC" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + adinrec + \- 1発話の音声入力データをファイルに記録する +.SH "概要" +.HP 8 +\fBadinrec\fR [\fIoptions\fR...] {\fIfilename\fR} +.SH "DESCRIPTION" +.PP +adinrec は,音声区間を一定時間内の零交差数とパワー(振幅レベル)のしき い値に基づいて切り出し,ファイルに記録する.デフォルトでは標準デバイス を用いてマイク入力から録音するが,\fB\-input\fR +オプションで デバイスを選択可能である.またプラグイン入力も選択できる. +.PP +サンプリング周波数は任意に設定可能である.録音形式は 16bit, 1 channel であり,書き出されるファイル形式は Microsoft WAV 形式である. 既に同じ名前のファイルが存在する場合は上書きされる. +.PP +ファイル名に "\-" を指定すると取り込んだ音声データを標準出力へ出 力する.この場合データ形式は RAW 形式になる. +.SH "OPTIONS" +.PP +Julius の全てのオプションが指定可能である.指定されたもののうち, 音声入力に関係するオプションのみ扱われる.以下に,adinrec 独自の オプションと関係する Julius オプションに分けて解説する. +.SS "adinrec specific options" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.RE +.PP +\fB \-raw \fR +.RS 3n +RAWファイル形式で出力する. +.RE +.SS "Concerning Julius options" +.PP +\fB \-input \fR {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} +.RS 3n +音声入力ソースを選択する.音声波形ファイルの場合は +fileあるいはrawfileを指 定する.起動後にプロンプトが表れるので,それに対してファイ ル名を入力する.adinnet +では, +adintool +などのクライアントプロセスから音声 データをネットワーク経由で受け取ることができる. +netaudio +はDatLinkのサーバから, +stdinは標準入力から音声入力を行う. +esdは,音声デバイスの共有手段として多くの Linuxのデスクトップ環境で利用されている EsounD daemon から入力する. +.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +振幅レベルのしきい値.値は 0 から 32767 の範囲で指定する. (default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +零交差数のしきい値.値は1秒あたりの交差数で指定する. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +音声区間開始部のマージン.単位はミリ秒. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +音声区間終了部のマージン.単位はミリ秒. 
(default: 400) +.RE +.PP +\fB \-zmean \fR +.RS 3n +入力音声ストリームに対して直流成分除去を行う.全ての音声処理の前段として処理される. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.RE +.PP +\fB \-48 \fR +.RS 3n +48kHzで入力を行い,16kHzにダウンサンプリングする. これは 16kHz のモデルを使用しているときのみ有効である. ダウンサンプリングの内部機能は +sptk +から 移植された. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +DatLink サーバのデバイス名 (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n + +\fB\-input adinnet\fR +使用時,接続を受け付ける adinnet のポート番号を指定する.(default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +音声取り込み時,デバイスやファイルによっては,音声波形中に振幅 が "0" となるフレームが存在することがある.Julius は通常,音声 入力に含まれるそのようなフレームを除去する.この零サンプル除去が うまく動かない場合,このオプションを指定することで自動消去を 無効化することができる. +.RE +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +jconf設定ファイルを読み込む.ファイルの内容がこの場所に展開される. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +プラグインを読み込むディレクトリを指定する.複数の場合は コロンで区切って並べて指定する. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(マイク入力で alsa デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "default". +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(マイク入力で oss デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "\fI/dev/dsp\fR". +.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Linux (alsa/oss) および Windows で,マイク入力時の遅延時間をミ リ秒単位で指定する.短い値を設定することで入力遅延を小さくでき るが,CPU の負荷が大きくなり,また環境によってはプロセスやOSの 挙動が不安定になることがある.最適な値はOS やデバイスに大きく 依存する.デフォルト値は動作環境に依存する. +.RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB adintool \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/adintool.1 diff -u /dev/null julius4/man/ja/adintool.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/adintool.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,228 @@ +.\" Title: + adintool + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "ADINTOOL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + adintool + \- 音声波形データの記録・分割・送信・受信ツール +.SH "概要" +.HP 9 +\fBadintool\fR {\-in\ \fIinputdev\fR} {\-out\ \fIoutputdev\fR} [\fIoptions\fR...] +.SH "DESCRIPTION" +.PP +adintool は,音声波形データ中の音声区間の検出および記録を連続的に行 うツールです.入力音声に対して零交差数と振幅レベルに基づく音声区間検 出を逐次行い,音声区間部分を連続出力します. +.PP +adintool は adinrec の高機能版です.音声データの入力元として,マイク 入力・ 音声波形ファイル・標準入力・ネットワーク入力(adinnet サーバー モード)が選択できます.Julius の +\fB\-input\fR +オプションも 使用可能で,プラグイン入力も選択できます. +.PP +出力先として,音声波形ファイル・標準出力・ネットワーク出力(adinnet ク ライアントモード)が選択できます.特にネットワーク出力(adinnet クライ アントモード)では, julius へネットワーク経由で音声を送信して音声認識 させることができます. +.PP +入力音声は音声区間ごとに自動分割され,逐次出力されます.音声区間の切 り出しには adinrec と同じ,一定時間内の零交差数とパワー(振幅レベル) のしきい値を用います.音声区間開始と同時に音声出力が開始されます.出 力としてファイル出力を選んだ場合は,連番ファイル名で検出された区間ごと に保存します. +.PP +サンプリング周波数は任意に設定可能です.録音形式は 16bit, 1 channel で,書き出されるファイル形式は Microsoft WAV 形式です. 既に同じ名前のファイルが存在する場合は上書きされます. +.SH "OPTIONS" +.PP +Julius の全てのオプションが指定可能である.指定されたもののうち, 音声入力に関係するオプションのみ扱われる.以下に,adintool の オプション,および有効な Julius オプションを解説する. +.SS "adintool specific options" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.RE +.PP +\fB \-in \fR \fIinputdev\fR +.RS 3n +音声を読み込む入力デバイスを指定する."mic" でマイク入力, "file" でファイル入力, "stdin" で標準入力から音声を読み込む. ファイル入力の場合,ファイル名は起動後に出てくるプロンプトに対 して指定する.また,"adinnet" で adintool は adinnet サーバー となり,adinnet クライアントから音声データを tcp/ip 経由で 受け取る.ポート番号は 5530 である("\fB\-inport\fR" で変更可能). +.sp +入力デバイスは,そのほか Julius の "\-input" オプションでも指定可能 である.その場合,プラグインからの入力も可能である. 
+.RE +.PP +\fB \-out \fR \fIoutputdev\fR +.RS 3n +音声を出力するデバイスを指定する."file" でファイル出力, stdout で標準出力へ出力する.ファイルの場合,出力ファイル名は オプション "\fB\-filename\fR" で与える.出力ファイル 形式は 16bit WAV 形式である. また,"adinnet" で adintool は adinnet クライアント となり,adinnet サーバへ取り込んだ音声データを tcp/ip 経由で 送信できる.送信先ホストは "\fB\-server\fR" で指定する. ポート番号は 5530 である("\fB\-port\fR" で変更可能). +.RE +.PP +\fB \-inport \fR \fInum\fR +.RS 3n +入力が adinnet の場合 (\-in adinnet),接続を受けるポート番号 を指定する.指定しない場合のデフォルトは 5530 である. +.RE +.PP +\fB \-server \fR [host] [,host...] +.RS 3n +出力が adinnet の場合 (\-out adinnet),送信先のサーバ名を指定する. 複数ある場合は,カンマで区切って指定する. +.RE +.PP +\fB \-port \fR [num] [,num...] +.RS 3n +出力が adinnet の場合 (\-out adinnet),送信先の各サーバのポート番号 を指定する.指定しない場合のデフォルトは 5530 である. +\fB\-server\fR +で複数のサーバを指定している場合, 全てについて明示的にポート番号を指定する必要がある. +.RE +.PP +\fB \-filename \fR \fIfile\fR +.RS 3n +ファイル出力 (\fB\-out file\fR) 時,出力ファイル名を 与える.デフォルトでは,検出された音声区間検出ごとに, "\fIfile.0000.wav\fR" , "\fIfile.0001.wav\fR" ... のように区間ごとに連番で 記録される.番号の初期値は 0 である(\fB\-startid\fRで 変更可能).なお,オプション +\fB\-oneshot\fR +指定時は 最初の区間だけが "\fIfile\fR" の名前で保存される. +.RE +.PP +\fB \-startid \fR \fInumber\fR +.RS 3n +ファイル出力時,記録を開始する連番番号の初期値を指定する.( デフォルト:0) +.RE +.PP +\fB \-oneshot \fR +.RS 3n +最初の音声区間が終了したら終了する. +.RE +.PP +\fB \-nosegment \fR +.RS 3n +入力音声の音声区間検出(無音による区切りと無音区間のスキップ)を 行わない. +.RE +.PP +\fB \-raw \fR +.RS 3n +RAWファイル形式で出力する. +.RE +.PP +\fB \-autopause \fR +.RS 3n +出力が adinnet の場合(\-out adinnet),音声区間が終了するたび に入力停止・動作停止状態に移行する.出力先の adinnet サーバか ら動作再開信号がくると音声入力を再開する. +.RE +.PP +\fB \-loosesync \fR +.RS 3n +出力が adinnet (\-out adinnet)で複数の出力先サーバへ出力している 場合,動作停止状態から動作再開信号によって動作を再開する際,adintool は すべてのサーバから動作再開信号を受けるまで動作を再開しない. このオプションを指定すると,少なくとも1つのサーバから再開信号 がくれば動作を再開するようになる. +.RE +.PP +\fB \-rewind \fR \fImsec\fR +.RS 3n +入力がマイクのとき,停止状態から動作を再開するとき,停止中から 持続して音声入力中だった場合,指定されたミリ秒分だけさかのぼって 録音を開始する. +.RE +.SS "Concerning Julius options" +.PP +\fB \-input \fR {mic|rawfile|adinnet|stdin|netaudio|esd|alsa|oss} +.RS 3n +音声入力ソースを選択する."\-in" の代わりにこちらを使うことも できる(最後に指定したほうが優先される).esd やプラグイン入力が 指定可能である. 
+.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +振幅レベルのしきい値.値は 0 から 32767 の範囲で指定する. (default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +零交差数のしきい値.値は1秒あたりの交差数で指定する. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +音声区間開始部のマージン.単位はミリ秒. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +音声区間終了部のマージン.単位はミリ秒. (default: 400) +.RE +.PP +\fB \-zmean \fR +.RS 3n +入力音声ストリームに対して直流成分除去を行う.全ての音声処理の前段として処理される. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.RE +.PP +\fB \-48 \fR +.RS 3n +48kHzで入力を行い,16kHzにダウンサンプリングする. これは 16kHz のモデルを使用しているときのみ有効である. ダウンサンプリングの内部機能は +sptk +から 移植された. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +DatLink サーバのデバイス名 (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n + +\fB\-input adinnet\fR +使用時,接続を受け付ける adinnet のポート番号を指定する.(default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +音声取り込み時,デバイスやファイルによっては,音声波形中に振幅 が "0" となるフレームが存在することがある.Julius は通常,音声 入力に含まれるそのようなフレームを除去する.この零サンプル除去が うまく動かない場合,このオプションを指定することで自動消去を 無効化することができる. +.RE +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +jconf設定ファイルを読み込む.ファイルの内容がこの場所に展開される. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +プラグインを読み込むディレクトリを指定する.複数の場合は コロンで区切って並べて指定する. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(マイク入力で alsa デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "default". +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(マイク入力で oss デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "\fI/dev/dsp\fR". +.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Linux (alsa/oss) および Windows で,マイク入力時の遅延時間をミ リ秒単位で指定する.短い値を設定することで入力遅延を小さくでき るが,CPU の負荷が大きくなり,また環境によってはプロセスやOSの 挙動が不安定になることがある.最適な値はOS やデバイスに大きく 依存する.デフォルト値は動作環境に依存する. +.RE +.SH "EXAMPLES" +.PP +マイクからの音声入力を,発話ごとに "data.0000.wav" から順に記録する: +.sp .RS 3n .nf % \fBadintool\fR \-in mic \-out file \-filename data .fi .RE +巨大な収録音声ファイル "foobar.raw" を,音声区間ごとに "foobar.1500.wav" "foobar.1501.wav" ... 
に分割する: +.sp .RS 3n .nf % \fBadintool\fR \-in file \-out file \-filename foobar \-startid 1500 % enter filename\->foobar.raw .fi .RE +ネットワーク経由で音声ファイルを転送する(区間検出なし): +.sp .RS 3n .nf (sender) % \fBadintool\fR \-in file \-out adinnet \-server \fIreceiver_hostname\fR \-nosegment (receiver) % \fBadintool\fR \-in adinnet \-out file \-nosegment .fi .RE +マイクからの入力音声を Julius へ送信して認識: +.sp .RS 3n .nf (sender) % \fBadintool\fR \-in mic \-out adinnet \-server \fIreceiver_hostname\fR (receiver) % \fBjulius\fR \-C ... \-input adinnet .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB adinrec \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/dfa_determinize.1 diff -u /dev/null julius4/man/ja/dfa_determinize.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/dfa_determinize.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,65 @@ +.\" Title: + dfa_determinize + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "DFA_DETERMINIZE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + dfa_determinize + \- 有限オートマトン文法を決定化する +.SH "概要" +.HP 16 +\fBdfa_determinize\fR [\-o\ \fIoutfile\fR] {dfafile} +.SH "DESCRIPTION" +.PP +dfa_determinize は,.dfa ファイルを等価な決定性 .dfa ファイルに変換し, 標準出力に出力します.オプション +\fB\-o\fR +で出力先を 指定することもできます. +.PP + +\fBmkdfa.pl\fR +が生成するDFAは常に決定化されており, 通常,\fBmkdfa.pl\fR +で作成された .dfa ファイルに対して このツールを使う必要はありません. +.SH "OPTIONS" +.PP +\fB \-o \fR \fIoutfile\fR +.RS 3n +出力ファイル名を指定する. +.RE +.SH "EXAMPLES" +.PP + +\fIfoo.dfa\fR +を決定化して +\fIbar.dfa\fR +に 保存する. 
+.sp .RS 3n .nf % \fBdfa_determinize\fR \-o bar.dfa foo.dfa .fi .RE +別の方法: +.sp .RS 3n .nf % \fBdfa_determinize\fR < foo.dfa > bar.dfa .fi .RE +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB dfa_minimize \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/dfa_minimize.1 diff -u /dev/null julius4/man/ja/dfa_minimize.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/dfa_minimize.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,64 @@ +.\" Title: + dfa_minimize + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "DFA_MINIMIZE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + dfa_minimize + \- 有限オートマトン文法を最小化する +.SH "概要" +.HP 13 +\fBdfa_minimize\fR [\-o\ \fIoutfile\fR] {dfafile} +.SH "DESCRIPTION" +.PP +dfa_minimize は,.dfa ファイルを等価な最小化の .dfa ファイルに変換し, 標準出力に出力します.オプション +\fB\-o\fR +で出力先を 指定することもできます. +.PP +バージョン 3.5.3 以降の Julius に付属の +\fBmkdfa.pl\fR +は, このツールを内部で自動的に呼び出すので,出力される .dfa は常に最小化 されており,これを単体で実行する必要はありません.バージョン 3.5.2 以前の +\fBmkdfa.pl\fR +で出力された .dfa は最小化されていないので, このツールで最小化するとサイズを最適化することができます. +.SH "OPTIONS" +.PP +\fB \-o \fR \fIoutfile\fR +.RS 3n +出力ファイル名を指定する. +.RE +.SH "EXAMPLES" +.PP + +\fIfoo.dfa\fR +を最小化して +\fIbar.dfa\fR +に 保存する. +.sp .RS 3n .nf % \fBdfa_minimize\fR \-o bar.dfa foo.dfa .fi .RE +別の方法: +.sp .RS 3n .nf % \fBdfa_minimize\fR < foo.dfa > bar.dfa .fi .RE +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/generate-ngram.1 diff -u /dev/null julius4/man/ja/generate-ngram.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/generate-ngram.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,79 @@ +.\" Title: + generate\-ngram + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GENERATE\-NGRAM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + generate\-ngram + \- N\-gram に従って文をランダム生成する +.SH "概要" +.HP 15 +\fBgenerate\-ngram\fR [\fIoptions\fR...] {\fIbinary_ngram\fR} +.SH "DESCRIPTION" +.PP +generate\-ngram は,与えられた N\-gram 確率に従って文をランダム生成する ツールです.\fIbinary_ngram\fR +には, バイナリ形式の N\-gram ファイルを指定します. +.SH "OPTIONS" +.PP +\fB \-n \fR \fInum\fR +.RS 3n +生成する文数を指定する(デフォルト:10) +.RE +.PP +\fB \-N \fR +.RS 3n +使用する N\-gram の長さを制限する(デフォルト:与えられたモデルで定義されている最大値,3\-gram なら 3). +.RE +.PP +\fB \-bos \fR +.RS 3n +文開始記号を指定する(デフォルト:) +.RE +.PP +\fB \-eos \fR +.RS 3n +文終了記号を指定する(デフォルト:) +.RE +.PP +\fB \-ignore \fR +.RS 3n +出力してほしくない単語を指定する(デフォルト:) +.RE +.PP +\fB \-v \fR +.RS 3n +冗長な出力を行う. +.RE +.PP +\fB \-debug \fR +.RS 3n +デバッグ用出力を行う. +.RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbingram \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/generate.1 diff -u /dev/null julius4/man/ja/generate.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/generate.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,94 @@ +.\" Title: + generate + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GENERATE" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + generate + \- 文法から文をランダム生成する +.SH "概要" +.HP 9 +\fBgenerate\fR [\-v] [\-t] [\-n\ \fInum\fR] [\-s\ \fIspname\fR] {prefix} +.SH "DESCRIPTION" +.PP +generate は文法に従って文をランダムに生成します. +.PP +実行には .dfa, .dict, .term の各ファイルが必要です. あらかじめ +\fBmkdfa.pl\fR +で生成しておいて下さい. +.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +単語ではなくカテゴリ名で出力する. +.RE +.PP +\fB \-n \fR \fInum\fR +.RS 3n +生成する文の数を指定する (default: 10) +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +生成においてスキップすべきショートポーズ単語の名前を指定する. (default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +デバッグ出力. +.RE +.SH "EXAMPLES" +.PP +vfr (フィッティングタスク用文法) での実行例: +.sp +.RS 3n +.nf +% generate vfr +Reading in dictionary...done +Reading in DFA grammar...done +Mapping dict item <\-> DFA terminal (category)...done +Reading in term file (optional)...done +42 categories, 99 words +DFA has 135 nodes and 198 arcs + \-\-\-\-\- +silB やめます silE +silB 終了します silE +silB シャツ を スーツ と 統一して 下さい silE +silB スーツ を カッター と 同じ 色 に 統一して 下さい silE +silB 交換して 下さい silE +silB これ を 覚えておいて 下さい silE +silB 覚えておいて 下さい silE +silB 戻って 下さい silE +silB スーツ を シャツ と 統一して 下さい silE +silB 上着 を 橙 に して 下さい silE +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate\-ngram \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/gram2sapixml.pl.1 diff -u /dev/null julius4/man/ja/gram2sapixml.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/gram2sapixml.pl.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,55 @@ +.\" Title: + gram2sapixml.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "GRAM2SAPIXML.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + gram2sapixml.pl + \- 認識用文法を SAPI XML 文法に変換するスクリプト +.SH "概要" +.HP 16 +\fBgram2sapixml.pl\fR [\fIprefix\fR...] +.SH "DESCRIPTION" +.PP +gram2sapixml.pl は,Julius の認識用文法ファイル (.grammar, .voca) から Microsoft SAPI XML 形式へ変換するスクリプトです. +\fIprefix\fR +には,変換する .grammar, .voca ファ イルのファイル名から拡張子を除外したものを指定します.複数指定した場合, それらは逐次変換されます. +.PP +入力文字コードは EUC\-JPを想定しています.出力ファイルは UTF\-8 エンコー ディングです.コード変換のため内部で +\fBiconv\fR +を使用 しています. +.PP +左再帰性については手作業による修正が必要です.元ファイルの .grammar の 構造をそのまま保持するため,.grammar における正順での左再帰記述がその まま .xml に反映されます.したがって,変換後 .xml に含まれる左再帰性の 解決は手作業で行わなければいけません. +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +.SH "DIAGNOSTICS" +.PP +変換は,元ファイルの文法の非終端記号と終端記号(単語カテゴリ名)をルール に変換するという単純なものです.実際にSAPIアプリケーションで使う場合に は,プロパティを指定するなど,手作業での修正が必要です. +.PP +内部でコード変換に +\fBiconv\fR +を使用しています. 実行パス上に iconv が無い場合,エラーとなります. +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. 
Index: julius4/man/ja/jclient.pl.1 diff -u /dev/null julius4/man/ja/jclient.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/jclient.pl.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,44 @@ +.\" Title: + jclient.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JCLIENT.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + jclient.pl + \- perl 版サンプルクライアント +.SH "概要" +.HP 11 +\fBjclient.pl\fR +.SH "DESCRIPTION" +.PP +Julius に付属のサンプルクライアント "jcontrol" の Perl 版です. モジュール(サーバ)モードで動く Julius から認識結果を受け取ったり, Julius を制御したりできます. +.PP +わずか 57 行の簡単なプログラムです.アプリケーションへ Julius を組み込 む際の参考になれば幸いです.ご自由にご利用ください. +.SH "EXAMPLES" +.PP .RS 3n .nf % \fBjulius\fR \-C ... \-module .fi .RE +上記のようにして Julius をモジュールモードで起動した後,jclient.pl を 起動します.接続するホストのデフォルトは localhost, ポート番号は 10500 です.変えたい場合はスクリプトの冒頭を書き換えてください. +.sp .RS 3n .nf % \fBjclient.pl\fR .fi .RE +音声入力を行えば,イベント内容や結果が jclient.pl 側に送信され, 標準出力に出力されます.また,jclient.pl に対してコマンドを入力する (最後に Enter を押す)と,Julius にコマンドが送信され,Julius が制御されます. コマンドは,仕様書にあるモジュールコマンドを生のまま記述します. +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB jcontrol \fR( 1 ) +.SH "COPYRIGHT" +.PP +jclient.pl は 西村竜一 さん (nisimura @ sys.wakayama\-u.ac.jp) によって作 成されました.本プログラムのご利用に関しては,作者は一切の保証をしませ ん.各自の責任のもとでご利用ください. +.PP +感想,御意見,御要望などのフィードバックは歓迎いたしますので, 上記メールアドレス,または下記ホームページへ御連絡ください. 
+.PP +http://w3voice.jp/ Index: julius4/man/ja/jcontrol.1 diff -u /dev/null julius4/man/ja/jcontrol.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/jcontrol.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,193 @@ +.\" Title: + jcontrol + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JCONTROL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + jcontrol + \- Juliusモジュールモード用のサンプルクライアント +.SH "概要" +.HP 9 +\fBjcontrol\fR {\fIhostname\fR} [\fIportnum\fR] +.SH "DESCRIPTION" +.PP +jcontrol は,モジュールモードで動作している julius に接続し,APIを介し てコントロールする簡単なコンソールプログラムです.Julius への一時停止 や再開などのコマンドの送信,および Julius からの認識結果や音声イベントの メッセージ受信を行うことができます. +.PP +起動後,jcontrol は,指定ホスト上において「モジュールモード」で動作中 のJulius に対し,接続を試みます.接続確立後,jcontrol はユーザーからの コマンド入力およびメッセージ受信待ち状態となります. +.PP +jcontrol は ユーザーが入力したコマンドを解釈し,対応するAPIコマンドを Julius へ送信します.また,Julius から認識結果や入力トリガ情報 など のメッセージが送信されてきたときは,その内容を標準出力へ書き出します. +.PP +モジュールモードの仕様については,関連文書をご覧下さい. +.SH "OPTIONS" +.PP +\fB hostname \fR +.RS 3n +接続先のホスト名 +.RE +.PP +\fB portnum \fR +.RS 3n +ポート番号(デフォルト:10500) +.RE +.SH "COMMANDS" +.PP +jcontrol は標準入力から1行ずつコマンド文字列を受け取る. コマンドの一覧は以下の通り. +.SS "動作制御" +.PP +pause +.RS 3n +Juliusの認識動作を中断させ,一時停止状態に移行させる.一時停止状 態にあるJuliusは,たとえ音声入力があっても認識処理を行わない. ある区間の音声認識処理の途中でこのコマンドを受け取った場合, Julius はその認識処理が終了した後,一時停止状態に移行する. +.RE +.PP +terminate +.RS 3n + +pauseと同じく,Juliusの認識動作を中断させ, 一時停止状態に移行させる.ある区間の音声認識処理の途中でこのコ マンドを受け取った場合,その入力を破棄して即座に一時停止状態に 移行する. +.RE +.PP +resume +.RS 3n +Julius を一時停止状態から通常状態へ移行させ,認識を再開させる. +.RE +.PP +inputparam \fIarg\fR +.RS 3n +文法切り替え時に音声入力であった場合の入力中音声の扱いを指定. "TERMINATE", "PAUSE", "WAIT"のうちいずれかを指定. +.RE +.PP +version +.RS 3n +Julius にバージョン文字列を返させる. +.RE +.PP +status +.RS 3n +Julius からシステムの状態 (active / sleep) を報告させる. +.RE +.SS "文法・単語認識関連" +.PP +changegram \fIprefix\fR +.RS 3n +認識文法を "\fIprefix.dfa\fR" と "\fIprefix.dict\fR" に切り替える.カレントプロ セス内の文法は全て消去され,指定された文法に置き換わる. 
+.RE +.PP +addgram \fIprefix\fR +.RS 3n +認識文法として "\fIprefix.dfa\fR" と "\fIprefix.dict\fR" をカレントプロセスに追加する. +.RE +.PP +deletegram \fIgramlist\fR +.RS 3n +カレントプロセスから指定された文法を削除する.文法の指定は,文 法名(追加時の +\fIprefix\fR)か,あるいは Julius から送られる +GRAMINFO内にある文法 ID で指定する.複数の文法を削除したい場合は,文法名もしくはIDをカ ンマで区切って複数指定する(IDと文法名が混在してもよい). +.RE +.PP +deactivategram \fIgramlist\fR +.RS 3n +カレントプロセスの指定された文法を一時的に無効にする.無効にされた 文法は,エンジン内に保持されたまま,認識処理からは一時的に除外される. 無効化された文法は +activategram +で再び有効化できる. +.sp +文法の指定は,文法名(追加時の +\fIprefix\fR)か,あるいはJulius から送ら れる +GRAMINFO内にある文法 ID で指定する.複 数の文法を指定したい場合は,文法名もしくはIDをカンマで区切って 複数指定する(IDと文法名が混在してもよい). +.RE +.PP +activategram \fIgramlist\fR +.RS 3n +カレントプロセスで無効化されている文法を有効化する. 文法の指定は,文法名(追加時の +\fIprefix\fR)か,あるいはJulius から送ら れる +GRAMINFO内にある文法 ID で指定する.複 数の文法を指定したい場合は,文法名もしくはIDをカンマで区切って 複数指定する(IDと文法名が混在してもよい). +.RE +.PP +addword \fIgrammar_name_or_id\fR \fIdictfile\fR +.RS 3n +dictfile の中身を,カレントプロセスの指定された文法に追加する. +.RE +.PP +syncgram +.RS 3n +addgram や deletegram などによる文法の更新を即時に行う. 同期確認用である. +.RE +.SS "プロセス関連のコマンド" +.PP +Julius\-4 では複数モデルの同時認識が行える.この場合, 認識プロセス ("\fB\-SR\fR" で指定された認識処理インスタンス) ごとにモジュールクライアントから操作を行うことができる. +.PP +クライアントからはどれか一つのプロセスが「カレントプロセス」として 割り当てられる.文法関連の命令はカレントプロセスに対して行われる. +.PP +listprocess +.RS 3n +Julius に現在エンジンにある認識プロセスの一覧を送信させる. +.RE +.PP +currentprocess \fIprocname\fR +.RS 3n +カレントプロセスを指定された名前のプロセスに切り替える. +.RE +.PP +shiftprocess +.RS 3n +カレントプロセスを循環切り替えする.呼ばれるたびにその次のプロセスに カレントプロセスが切り替わる. +.RE +.PP +addprocess \fIjconffile\fR +.RS 3n +エンジンに認識プロセスを新たに追加する.与える +\fIjconffile\fR +は,通常のものと違い, ただ一種類の LM 設定を含むものである必要がある.また,実際に送られる のはパス名のみであり,ファイル読み込みはJulius側で行われるため, ファイルパスは Julius から見える場所を指定する必要が有る. +.sp +追加された LM および認識プロセスは,jconffile の名前が プロセス名となる. +.RE +.PP +delprocess \fIprocname\fR +.RS 3n +指定された名前の認識プロセスをエンジンから削除する. +.RE +.PP +deactivateprocess \fIprocname\fR +.RS 3n +指定された名前の認識プロセスを,一時的に無効化する.無効化され たプロセスは次回以降の入力に対して認識処理からスキップされる. 無効化されたプロセスは +activateprocess +で 再び有効化できる. +.RE +.PP +activateprocess \fIprocname\fR +.RS 3n +指定された名前の認識プロセスを有効化する. 
+.RE +.SH "EXAMPLES" +.PP +Julius からのメッセージは "> " を行の先頭につけてそのまま標準出力に出力 されます.以下は実行例です. +.sp .RS 3n .nf % \fBjulius\fR \-C ... \-module .fi .RE +上記のようにして Julius をモジュールモードで起動した後, jcontrol をそのホスト名を指定して起動します. +.sp .RS 3n .nf % \fBjcontrol\fR hostname .fi .RE +音声入力を行えば,イベント内容や結果が jcontrol 側に送信されます. jcontrol に対してコマンドを入力する(最後に Enter を押す)と, Julius にコマンドが送信され,Julius が制御されます. +.PP +詳しいプロトコルについては,関連文書を参照してください. +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/julius.1 diff -u /dev/null julius4/man/ja/julius.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/julius.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,1324 @@ +.\" Title: + julius + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "JULIUS" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + julius + \- 大語彙連続音声認識エンジン +.SH "概要" +.HP 7 +\fBjulius\fR [\-C\ \fIjconffile\fR] [\fIoptions\fR...] +.SH "内容" +.PP +Julius は数万語を対象とした大語彙連続音声認識を行うことのできるフリー の認識エンジンです.単語N\-gramを用いた2パス構成の段階的探索により高精 度な認識を行うことができます.また,小規模語彙のための文法ベースの認識 や単単語認識も行うことができます.認識対象としてマイク入力,録音済みの 音声波形ファイル,特徴抽出したパラメータファイルなどに対応しています. +.PP +コアの認識処理は,全て JuliusLib ライブラリとして提供されています. JuliusはJuliusLibを用いる音声アプリケーションの一つです. +.PP +Julius を用いて音声認識を行うには,音響モデル,単語辞書,および言語モ デルが必要です. +.SH "設定" +.PP +Julius および JuliusLib コアエンジンの設定(動作選択,設定,モデル指定, パラメータ変更など)は,すべてここで説明する「オプション」で指定する. Julius に対しては,これらのオプションをコマンドライン引数として直接指 定するか,あるいはテキストファイル内に記述したものを "\fB\-C\fR" につづけて指定する.このオプションを記述したテキストファイルは "jconf 設定ファイル" と呼ばれる. 
+.PP +JuliusLib を用いる他のアプリケーションにおいても,JuliusLib内の認識 エンジンへの動作指定は,同様にこのオプション群で行う.jconf 設定ファイル に設定内容を記述して,それをメイン関数の最初で +\fBj_config_load_file_new(char *jconffile);\fR +で呼び出 すことで,JuliusLib 内の認識エンジンに設定をセットすることができる. +.PP +なお,jconf 設定ファイル内では,相対ファイルパスはその jconf ファイル の位置からの相対パスとして解釈される(カレントディレクトリではない). 注意されたい. +.PP +以下に各オプションを解説する. +.SS "Julius アプリケーションオプション" +.PP +.PP +JuliusLib とは独立した,アプリケーションとしての Julius の機能に関する オプションである.認識結果の出力,文字コード変換,ログの設定,モジュー ルモードなどを含む.これらのオプションは,JuliusLib を組み込んだ他のア プリケーションでは使用できないので注意すること. +.PP +\fB \-outfile \fR +.RS 3n +認識結果を個別のファイルに出力する.入力ファイルごとの認識結果を, その拡張子を ".out" に変えたファイルに保存する. (rev. 4.0) +.RE +.PP +\fB \-separatescore \fR +.RS 3n +認識結果で言語スコアと音響スコアを個別に出力する.指定しない場 合,和の値が認識結果のスコアとして出力される. +.RE +.PP +\fB \-callbackdebug \fR +.RS 3n +コールバックがJuliusLibから呼ばれたときにコールバック名を 標準出力に出力する.デバッグ用である.(rev.4.0) +.RE +.PP +\fB \-charconv \fR \fIfrom\fR \fIto\fR +.RS 3n +出力で文字コードの変換を行う.\fIfrom\fR +は言語モデルの文字セットを,\fIto\fR +は出 力の文字セットを指定する.文字セットは,Linux では +iconv +で用いられるコード名である.Windows では,コードページ番号あるいはいかに示すコード名のどれかである: +ansi, +mac, +oem, +utf\-7, +utf\-8, +sjis, +euc. +.RE +.PP +\fB \-nocharconv \fR +.RS 3n +文字コード変換を行わない.\fB\-charconv\fR +の指定を リセットする. +.RE +.PP +\fB \-module \fR [port] +.RS 3n +Julius を「サーバモジュールモード」で起動する.TCP/IP 経由でク ライアンとやりとりし,処理の制御や認識結果・イベントの通知が行 える.port +はポート番号であり,省略時は 10500 が用いられる. +.RE +.PP +\fB \-record \fR \fIdir\fR +.RS 3n +区間検出された入力音声をファイルに逐次保存する. +\fIdir\fRは保存するディレクトリを指定する. ファイル名は,それぞれの処理終了時のシステム時間から +YYYY.MMDD.HHMMSS.wavの形で保存される.ファ イル形式は16bit, 1チャンネルのWAV形式である. なお,入力がGMM等によって棄却された場合も記録される. +.RE +.PP +\fB \-logfile \fR \fIfile\fR +.RS 3n +通常 Julius は全てのログ出力を標準出力に出力する. このオプションを指定することで,それらの出力を指定ファイルに 切替えることができる.(Rev.4.0) +.RE +.PP +\fB \-nolog \fR +.RS 3n +ログ出力を禁止する.標準出力には何も出力されなくなる. (Rev.4.0) +.RE +.PP +\fB \-help \fR +.RS 3n +エンジン設定,オプション一覧などのヘルプを出力して終了する. +.RE +.SS "全体オプション" +.PP +全体オプションは,モデルや探索以外のオプションであり, 音声入力・音検出・GMM・プラグイン・その他の設定を含む. 全体オプションは, 音響モデル(\fB\-AM\fR)・言語モデル(\fB\-LM\fR)・デ コーダ(\fB\-SR\fR)などのセクション定義の前に定義するか, +\fB\-GLOBAL\fR +のあとに指定する. 
+.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBオーディオ入力\fR +.RS +.PP +\fB \-input \fR {mic|rawfile|mfcfile|adinnet|stdin|netaudio|esd|alsa|oss} +.RS 3n +音声入力ソースを選択する.音声波形ファイルの場合は +fileあるいはrawfileを指 定する.HTK +形式の特徴量ファイルを認識する場合は +htkparamあるいはmfcfile +を指定する.起動後にプロンプトが表れるので,それに対してファイ ル名を入力する.adinnet +では, +adintool +などのクライアントプロセスから音声 データをネットワーク経由で受け取ることができる. +netaudio +はDatLinkのサーバから, +stdinは標準入力からの音声入力を認識する. +esdは,音声デバイスの共有手段として多くの Linuxのデスクトップ環境で利用されている EsounD daemon からの入 力を認識する. +.RE +.PP +\fB \-filelist \fR \fIfilename\fR +.RS 3n +(\fB\-input rawfile|mfcfile\fR +時) +\fIfilename\fR内に列挙されている全てのファ イルについて認識を順次行う. +\fIfilename\fRには認識する入力ファイル名 を1行に1つずつ記述する. +.RE +.PP +\fB \-notypecheck \fR +.RS 3n +入力の特徴量ベクトルの型チェックを無効にする.通常 Julius は入 力の型が音響モデルとマッチするかどうかをチェックし,マッチしない とエラー終了する.このオプションはそのチェックを回避する.なんらかの 理由で型チェックがうまく動作しないときに使用する. +.RE +.PP +\fB \-48 \fR +.RS 3n +48kHzで入力を行い,16kHzにダウンサンプリングしながら認識する. これは 16kHz のモデルを使用しているときのみ有効である. ダウンサンプリングの内部機能は +sptk +から 移植された. (Rev. 4.0) +.RE +.PP +\fB \-NA \fR \fIdevicename\fR +.RS 3n +DatLink サーバのデバイス名 (\fB\-input netaudio\fR). +.RE +.PP +\fB \-adport \fR \fIport_number\fR +.RS 3n + +\fB\-input adinnet\fR +使用時,接続を受け付ける adinnet のポート番号を指定する.(default: 5530) +.RE +.PP +\fB \-nostrip \fR +.RS 3n +音声取り込み時,デバイスやファイルによっては,音声波形中に振幅 が "0" となるフレームが存在することがある.Julius は通常,音声 入力に含まれるそのようなフレームを除去する.この零サンプル除去が うまく動かない場合,このオプションを指定することで自動消去を 無効化することができる. +.RE +.PP +\fB \-zmean \fR, \fB \-nozmean \fR +.RS 3n +入力音声ストリームに対して直流成分除去を行う.全ての音声処理の前段として処理される. +\fB\-zmeanframe\fRオプションも見よ. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBレベルと零交差による入力検知\fR +.RS +.PP +\fB \-cutsilence \fR, \fB \-nocutsilence \fR +.RS 3n +レベルと零交差による入力検知を行うかどうかを指定する.デフォル トは,リアルタイム認識(デバイス直接入力およびネットワーク入力) では on, ファイル入力では off である.このオプションを指定する ことで,例えば長時間録音された音声ファイルに対して音声区間検出 を行いながら認識を行うこともできる. +.RE +.PP +\fB \-lv \fR \fIthres\fR +.RS 3n +振幅レベルのしきい値.値は 0 から 32767 の範囲で指定する. 
(default: 2000) +.RE +.PP +\fB \-zc \fR \fIthres\fR +.RS 3n +零交差数のしきい値.値は1秒あたりの交差数で指定する. (default: 60) +.RE +.PP +\fB \-headmargin \fR \fImsec\fR +.RS 3n +音声区間開始部のマージン.単位はミリ秒. (default: 300) +.RE +.PP +\fB \-tailmargin \fR \fImsec\fR +.RS 3n +音声区間終了部のマージン.単位はミリ秒. (default: 400) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB入力棄却\fR +.RS +.PP +入力長,あるいは平均パワーによる入力の事後棄却が行える. 平均パワーによる棄却は,デフォルトでは無効化されており,ソースからコンパイ ルする際に +configureに +\-\-enable\-power\-reject +を指定することで有効となる. リアルタイム認識時で,かつ特徴量でパワー項を持つ場合のみ使用できる. +.PP +\fB \-rejectshort \fR \fImsec\fR +.RS 3n +検出された区間長が\fImsec\fR以下の入力を 棄却する.その区間の認識は中断・破棄される. +.RE +.PP +\fB \-powerthres \fR \fIthres\fR +.RS 3n +切り出し区間の平均パワーのしきい値.(Rev.4.0) +.sp +このオプションはコンパイル時に +\-\-enable\-power\-rejectが指定されたときに 有効となる. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBGMM / GMM\-VAD\fR +.RS +.PP +\fB \-gmm \fR \fIhmmdefs_file\fR +.RS 3n +GMM定義ファイル.3状態(出力状態が1つのみ)のHMMとして定義す る.形式はHTK形式で与える.形式や使用できる特徴量の制限は音響 モデルと同じである. なお,GMMで用いるMFCC特徴量の設定は, +\fB\-AM_GMM\fRのあとに音響モデルと同様に指定する.こ の特徴量設定は音響モデルと別に,明示的に指定する必要があること に注意が必要である. +.RE +.PP +\fB \-gmmnum \fR \fInumber\fR +.RS 3n +GMM指定時,計算するガウス分布数を指定する.フレームごとにGMMの 出力確率を求める際,各モデルで定義されている混合ガウス分布のう ち,この\fInumber\fRで指定した数の上位ガ ウス分布の確率のみを計算する.小さな値を指定するほどGMMの計算 量を削減できるが,計算精度が悪くなる.(default: 10) +.RE +.PP +\fB \-gmmreject \fR \fIstring\fR +.RS 3n +GMMで定義されているモデル名のうち,非音声として棄却すべきモデ ルの名称を指定する.モデル名を複数指定することができる.複数指 定する場合は,空白を入れずコンマで区切って一つの +\fIstring\fRとして指定する. +.RE +.PP +\fB \-gmmmargin \fR \fIframes\fR +.RS 3n +(GMM_VAD) GMM VAD による区間検出の開始部マージン.単位はフレー ム数で指定する.(default: 20) (Rev. 4.0) +.sp +このオプションは\-\-enable\-gmm\-vad付きでコンパイル されたときに有効となる. +.RE +.PP +\fB \-gmmup \fR \fIvalue\fR +.RS 3n +(GMM_VAD) 音声区間の開始とみなす VAD スコアの閾値.VADスコアは (音声GMMの最大尤度 \- 非音声HMMの最大尤度) で表される. (Default: 0.7) (Rev.4.1) +.sp +このオプションは\-\-enable\-gmm\-vad付きでコンパイル されたときに有効となる. 
+.RE +.PP +\fB \-gmmdown \fR \fIvalue\fR +.RS 3n +(GMM_VAD) 音声区間の終了とみなす VAD スコアの閾値.VADスコアは (音声GMMの最大尤度 \- 非音声HMMの最大尤度) で表される. (Default: \-0.2) (Rev.4.1) +.sp +このオプションは\-\-enable\-gmm\-vad付きでコンパイル されたときに有効となる. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBデコーディングオプション\fR +.RS +.PP +デコーディングオプションは,使用する認識アルゴリズムに関する設定を行う オプションである.この設定はエンジン全体に対する設定であり,全ての認識 処理インスタンスで共通の設定となる.探索の幅や言語重みなどの個々のデコー ディング設定については,認識処理インスタンスごとに指定する. +.PP +\fB \-realtime \fR, \fB \-norealtime \fR +.RS 3n +入力と並行してリアルタイム認識を行うかどうかを明示的に指定する. デフォルトの設定は入力デバイスに依存し,マイクロフォン等のデバ イス直接認識,ネットワーク入力,および DatLink/NetAudio 入力の 場合は ON, ファイル入力や特徴量入力についてはOFFとなっている. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBその他\fR +.RS +.PP +\fB \-C \fR \fIjconffile\fR +.RS 3n +jconf設定ファイルを読み込む.ファイルの内容がこの場所に展開される. +.RE +.PP +\fB \-version \fR +.RS 3n +バージョン情報を標準エラー出力に出力して終了する. +.RE +.PP +\fB \-setting \fR +.RS 3n +エンジン設定情報を標準エラー出力に出力して終了する. +.RE +.PP +\fB \-quiet \fR +.RS 3n +出力を抑制する.認識結果は単語列のみが出力される. +.RE +.PP +\fB \-debug \fR +.RS 3n +(デバッグ用) モデルの詳細や探索過程の記録など,様々な デバッグ情報をログに出力する. +.RE +.PP +\fB \-check \fR {wchmm|trellis|triphone} +.RS 3n +デバッグ用のチェックモードに入る. +.RE +.PP +\fB \-plugindir \fR \fIdirlist\fR +.RS 3n +プラグインを読み込むディレクトリを指定する.複数の場合は コロンで区切って並べて指定する. +.RE +.RE +.SS "複数モデル認識のためのインスタンス宣言" +.PP +\fB \-AM \fR \fIname\fR +.RS 3n +音響モデルインスタンスを新たに宣言する.以降の音響モデルに関す る設定はこのインスタンスに対するものと解釈される. +\fIname\fR +にはインスタンスにつける名前を 指定する(既にある音響モデルインスタンスと同じ名前であってはい けない). (Rev.4.0) +.RE +.PP +\fB \-LM \fR \fIname\fR +.RS 3n +言語モデルインスタンスを新たに宣言する.以降の言語モデルに関す る設定はこのインスタンスに対するものと解釈される. +\fIname\fR +にはインスタンスにつける名前を 指定する(既にある言語モデルインスタンスと同じ名前であってはい けない). (Rev.4.0) +.RE +.PP +\fB \-SR \fR \fIname\fR \fIam_name\fR \fIlm_name\fR +.RS 3n +認識処理インスタンスを新たに宣言する.以降の認識処理や探索に関 する設定はこのインスタンスに対するものと解釈される. 
+\fIname\fR +にはインスタンスにつける名前を 指定する(既にある認識処理インスタンスと同じ名前であってはいけ ない).\fIam_name\fR, +\fIlm_name\fR +にはそれぞれこのインスタン スが使用する音響モデルと言語モデルのインスタンスを名前,あるい は ID 番号で指定する.(Rev.4.0) +.RE +.PP +\fB \-AM_GMM \fR +.RS 3n +GMM使用時に,GMM計算のための特徴量抽出パラメータを,この宣言の あとに指定する.もし GMM 使用時にこのオプションでGMM用の特徴量 パラメータを指定しなかった場合,最後に指定した音響モデル用の特 徴量がそのまま用いられる. (Rev.4.0) +.RE +.PP +\fB \-GLOBAL \fR +.RS 3n +全体オプション用のセクションを開始する.\fB\-AM\fR, +\fB\-LM\fR, +\fB\-SR\fR +などのインスタンス 宣言を用いる場合,音声入力設定などの全体オプションは,これらの 全てのインスタンス定義よりも前か,あるいはこのオプションの あとに指定する必要がある.この全体オプション用のセクションは, jconf 内で何回現れても良い. (Rev.4.1) +.RE +.PP +\fB \-nosectioncheck \fR, \fB \-sectioncheck \fR +.RS 3n +複数インスタンスを用いる jconf において,オプションの位置チェッ クの有効・無効を指定する.有効である場合,ある種類のインスタン スの宣言がされたあとは,他のインスタンス宣言が現れるまで,その インスタンスのオプションしか指定できない(例: +\fB\-AM\fR +のあと,他の +\fB\-AM\fRや +\fB\-LM\fRなどが現れるまで,音響モデルオプションしか 指定できない.他のオプションがあらわれた場合はエラーとなる). また,全体オプションは全てのモデルインスタンスの前に指定する必 要がある.デフォルトでは有効になっている.(Rev.4.1) +.RE +.SS "言語モデル (\fB\-LM\fR)" +.PP +このグループには,各モデルタイプごとに指定するオプションが含まれている. 一つのインスタンスには一つのモデルタイプだけが指定可能である. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBN\-gram\fR +.RS +.PP +\fB \-d \fR \fIbingram_file\fR +.RS 3n +使用するN\-gramをバイナリファイル形式で指定する. バイナリ形式への変換は +mkbingram +を 使用する. +.RE +.PP +\fB \-nlr \fR \fIarpa_ngram_file\fR +.RS 3n +前向き (left\-to\-right) のN\-gram 言語モデルを指定する. +\fIarpa_ngram_file\fR +はARPA標準形式のファ イルである必要がある. +.RE +.PP +\fB \-nrl \fR \fIarpa_ngram_file\fR +.RS 3n +後ろ向き (right\-to\-left) のN\-gram 言語モデルを指定する. +\fIarpa_ngram_file\fR +はARPA標準形式のファ イルである必要がある. +.RE +.PP +\fB \-v \fR \fIdict_file\fR +.RS 3n +N\-gram,または文法用の単語辞書ファイルを指定する. +.RE +.PP +\fB \-silhead \fR \fIword_string\fR \fB \-siltail \fR \fIword_string\fR +.RS 3n +音声入力両端の無音区間に相当する「無音単語」エントリを指定する. 単語の読み(N\-gramエントリ名),あるいは"#"+単語番号(辞書ファ イルの行番号\-1)で指定する.デフォルトはそれぞれ "", "" である. +.RE +.PP +\fB \-iwspword \fR +.RS 3n +ポーズに対応する無音単語を辞書に追加する.追加される単語の内容は オプション\fB\-iwspentry\fRで変更できる. 
+.RE +.PP +\fB \-iwspentry \fR \fIword_entry_string\fR +.RS 3n + +\fB\-iwspword\fR指定時に追加される単語エントリの内容 を指定する.辞書エントリと同じ形式で指定する.(default: " [sp] sp sp") +.RE +.PP +\fB \-sepnum \fR \fInumber\fR +.RS 3n +木構造化辞書の構築時に線形登録する単語数を指定する.(default: 150) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB文法\fR +.RS +.PP + +\fB\-gram\fRや\fB\-gramlist\fRで文法を複数回指定す ることで,一つのインスタンス内で複数の文法を用いることができる. (旧Juliusのオプション +\fB\-dfa\fR, +\fB\-v\fR +の 組合せは単一の文法のみ指定可能である) +.PP +\fB \-gram \fR gramprefix1[,gramprefix2[,gramprefix3,...]] +.RS 3n +認識に使用する文法を指定する.文法はファイル(辞書および構文制約 有限オートマトン)のプレフィックスで指定する.すなわち,ある認 識用文法が\fIdir/foo.dict\fRと +\fIdir/foo.dfa\fR +としてあるとき, +dir/fooのように拡張子を省いた名前で指定する. 文法はコンマで区切って複数指定することができる.また繰り返し 使用することでも複数指定できる. +.RE +.PP +\fB \-gramlist \fR \fIlist_file\fR +.RS 3n +認識に使用する文法のリストをファイルで指定する. +\fIlist_file\fRには, +\fB\-gram\fR +と同様の文法プレフィックスを1行に1つず つ記述する.また,このオプションを繰り返し使用することで,複数 のリストファイルを指定できる.なお,リスト内で文法を相対パスで 指定した場合,それは,そのリストファイルからの相対パスとして解 釈されることに注意が必要である. +.RE +.PP +\fB \-dfa \fR \fIdfa_file\fR \fB \-v \fR \fIdict_file\fR +.RS 3n +認識に使用する文法の構文制約オートマトンと辞書をそれぞれ指定する. (Julius\-3.x との互換性のための古いオプションであり,使用すべきでない) +.RE +.PP +\fB \-nogram \fR +.RS 3n +それまでに +\fB\-gram\fR,\fB\-gramlist\fR, +\fB\-dfa\fR +および +\fB\-v\fR +で 指定された文法のリストをクリアし,文法の指定なしの状態 にする. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB単単語\fR +.RS +.PP +\fB \-w \fR \fIdict_file\fR +.RS 3n +単単語認識で用いる単語辞書を指定する.ファイル形式は単語N\-gram や文法と同一である.辞書上の全ての単語が認識対象となる. (Rev.4.0) +.RE +.PP +\fB \-wlist \fR \fIlist_file\fR +.RS 3n +単語辞書のリストを指定する.\fIlist_file\fR +には1行に一つずつ,使用する単語辞書のパスを記述する.相対パスを 用いた場合,それはその\fIlist_file\fRから の相対パスとして解釈される. (Rev.4.0) +.RE +.PP +\fB \-nogram \fR +.RS 3n +それまでに +\fB\-w\fR +あるいは +\fB\-wlist\fRで 指定された辞書のリストをクリアし,指定なしの状態に戻す. +.RE +.PP +\fB \-wsil \fR \fIhead_sil_model_name\fR \fItail_sil_model_name\fR \fIsil_context_name\fR +.RS 3n +単単語認識時,音声入力の両端の無音モデルおよびそのコンテキスト 名を指定する. +\fIsil_context_name\fRとして +NULLを指定した場合,各モデル名がそのまま コンテキストとして用いられる. 
+.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBUser\-defined LM\fR +.RS +.PP +\fB \-userlm \fR +.RS 3n +プログラム中のユーザ定義言語スコア計算関数を使用することを宣言 する.(Rev.4.0) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBその他の言語モデル関連\fR +.RS +.PP +\fB \-forcedict \fR +.RS 3n +単語辞書読み込み時のエラーを無視する.通常Juliusは単語辞書内に エラーがあった場合そこで動作を停止するが,このオプションを 指定することで,エラーの生じる単語をスキップして処理を続行する ことができる. +.RE +.RE +.SS "音響モデル・特徴量抽出 (\fB\-AM\fR) (\fB\-AM_GMM\fR)" +.PP +音響モデルオプションは,音響モデルおよび特徴量抽出・フロントエンド処理 に関する設定を行う.特徴量抽出,正規化処理,スペクトルサブトラクションの 指定もここで行う. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB音響HMM関連\fR +.RS +.PP +\fB \-h \fR \fIhmmdef_file\fR +.RS 3n +使用するHMM定義ファイル. +HTK +の ASCII 形 式ファイル,あるいはJulius バイナリ形式のファイルのどちらかを 指定する.バイナリ形式へは +mkbinhmm +で 変換できる. +.RE +.PP +\fB \-hlist \fR \fIhmmlist_file\fR +.RS 3n +HMMlistファイルを指定する.テキスト形式,あるいはバイナリ形式 のどちらかを指定する.バイナリ形式へは +mkbinhmmlist +で変換できる. +.RE +.PP +\fB \-tmix \fR \fInumber\fR +.RS 3n +Gaussianpruning の計算状態数を指定する.小さ いほど計算が速くなるが,音響尤度の誤差が大きくなる.See also +\fB\-gprune\fR. (default: 2) +.RE +.PP +\fB \-spmodel \fR \fIname\fR +.RS 3n +文中のショートポーズに対応する音韻HMMの名前を指定する.このポーズ モデル名は,\fB\-iwsp\fR, +\fB\-spsegment\fR, +\fB\-pausemodels\fRに関係する.また,文法使用時に スキップ可能なポーズ単語エントリの識別にも用いられる. (default: "sp") +.RE +.PP +\fB \-multipath \fR \fB \-nomultipath \fR +.RS 3n +状態間遷移を拡張するマルチパスモードを有効にする.オプション指 定がない場合,Julius は音響モデルの遷移をチェックし,必要であ れば自動的にマルチパスモードを有効にする.このオプションは,ユー ザが明示的にモードを指定したい場合に使用する. +.sp +この機能は 3.x ではコンパイル時オプションであったが,4.0 より 実行時オプションとなった.(rev.4.0) +.RE +.PP +\fB \-gprune \fR {safe|heuristic|beam|none|default} +.RS 3n +使用する Gaussian pruning アルゴリズムを選択する. +noneを指定すると Gaussian pruning を無効化 しすべてのガウス分布について厳密に計算する. +safe +は上位 N 個を計算する. +heuristic +と +beam +はsafe に比べてより積極的な枝刈りを行うため計算量削減の効果が大きいが, 認識精度の低下を招く可能性がある.defaultが 指定された場合,デフォルトの手法を使う.(default: tied\-mixture model の場合,standard 設定ではsafe,fast設 定ではbeam.tied\-mixture でない場合 +none). 
+.RE +.PP +\fB \-iwcd1 \fR {max|avg|best number} +.RS 3n +第1パスの単語間トライフォン計算法を指定する. +max +指定時,同じコンテキストのトライフォン集合の 全尤度の最大値を近似尤度として用いる.avg +は 全尤度の平均値を用いる.best number +は上位 N 個の トライフォンの平均値を用いる. デフォルトは,一緒に使用される言語モデルに依存する.N\-gram使用 時には +best 3,文法使用時は +avgとなる.もしこの音響モデルが異なるタイプの 複数の言語モデルで共有される場合は,後に定義されたほうのデフォルトが デフォルト値として用いられる. +.RE +.PP +\fB \-iwsppenalty \fR \fIfloat\fR +.RS 3n + +\fB\-iwsp\fRによって末尾に付加される単語末ショートポー ズの挿入ペナルティ.ここで指定した値が,通常単語の末尾から単語 末ショートポーズへの遷移に追加される. +.RE +.PP +\fB \-gshmm \fR \fIhmmdef_file\fR +.RS 3n +Gaussian Mixture Selection 用のモノフォン音響モデルを指定する. GMS用モノフォンは通常のモノフォンから +mkgshmm +によって生成できる. +.RE +.PP +\fB \-gsnum \fR \fInumber\fR +.RS 3n +GMS 使用時,対応するトライフォンを詳細計算するモノフォンの 状態の数を指定する. (default: 24) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB特徴量抽出パラメータ\fR +.RS +.PP +\fB \-smpPeriod \fR \fIperiod\fR +.RS 3n +音声のサンプリング周期を指定する.単位は,100ナノ秒の単位で指 定する.サンプリング周期は +\fB\-smpFreq\fR +でも指定 可能.(default: 625) +.sp +このオプションは +HTK +の +SOURCERATE +に対応する.同じ値が指定できる. +.sp +複数の音響モデルを用いる場合,全インスタンスで共通の値を指定する必要 がある. +.RE +.PP +\fB \-smpFreq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.sp +複数の音響モデルを用いる場合,全インスタンスで共通の値を指定する必要 がある. +.RE +.PP +\fB \-fsize \fR \fIsample_num\fR +.RS 3n +窓サイズをサンプル数で指定 (default: 400). +.sp +このオプションは +HTK +の +WINDOWSIZE +に対応する.ただし値はHTKと異なり,(HTKの値 / smpPeriod) となる. +.sp +複数の音響モデルを用いる場合,全インスタンスで共通の値を指定する必要 がある. +.RE +.PP +\fB \-fshift \fR \fIsample_num\fR +.RS 3n +フレームシフト幅をサンプル数で指定 (default: 160). +.sp +このオプションは +HTK +の +TARGETRATE +に対応する.ただし値はHTKと異なり,(HTKの値 / smpPeriod) となる. +.sp +複数の音響モデルを用いる場合,全インスタンスで共通の値を指定する必要 がある. +.RE +.PP +\fB \-preemph \fR \fIfloat\fR +.RS 3n +プリエンファシス係数 (default: 0.97) +.sp +このオプションは +HTK +の +PREEMCOEF +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-fbank \fR \fInum\fR +.RS 3n +フィルタバンクチャンネル数.(default: 24) +.sp +このオプションは +HTK +の +NUMCHANS +に対応する.同じ値が指定できる.指定しないときのデフォルト値が +HTKと異なっていることに注意(HTKでは22). +.RE +.PP +\fB \-ceplif \fR \fInum\fR +.RS 3n +ケプストラムのリフタリング係数. 
(default: 22) +.sp +このオプションは +HTK +の +CEPLIFTER +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-rawe \fR, \fB \-norawe \fR +.RS 3n +エネルギー項の値として,プリエンファシス前の raw energy を使用 する / しない (default: disabled=使用しない) +.sp +このオプションは +HTK +の +RAWENERGY +に対応する. 指定しないときのデフォルトがHTKと異なっていることに注意(HTKで はenabled). +.RE +.PP +\fB \-enormal \fR, \fB \-noenormal \fR +.RS 3n +エネルギー項の値として,発話全体の平均で正規化した正規化エネルギー を用いるかどうかを指定する.(default: \-noenormal) +.sp +このオプションは +HTK +の +ENORMALISE +に対応する. 指定しないときのデフォルトがHTKと異なっていることに注意(HTKで はenabled). +.RE +.PP +\fB \-escale \fR \fIfloat_scale\fR +.RS 3n +エネルギー正規化時の,対数エネルギー項のスケーリング係数. (default: 1.0) +.sp +このオプションは +HTK +の +ESCALE +に対応する.デフォルト値がHTKと異なっていることに注意(HTKでは 0.1). +.RE +.PP +\fB \-silfloor \fR \fIfloat\fR +.RS 3n +エネルギー正規化時の,無音部のエネルギーのフロアリング値. (default: 50.0) +.sp +このオプションは +HTK +の +SILFLOOR +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-delwin \fR \fIframe\fR +.RS 3n +一次差分計算用のウィンドウフレーム幅.(default: 2) +.sp +このオプションは +HTK +の +DELTAWINDOW +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-accwin \fR \fIframe\fR +.RS 3n +二次差分計算用のウィンドウフレーム幅.(default: 2) +.sp +このオプションは +HTK +の +ACCWINDOW +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-hifreq \fR \fIHz\fR +.RS 3n +MFCCのフィルタバンク計算時におけるバンド制限を有効化する.この オプションではカットオフ周波数の上限値を指定する. \-1 を指定することで無効化できる.(default: \-1) +.sp +このオプションは +HTK +の +HIFREQ +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-lofreq \fR \fIHz\fR +.RS 3n +MFCCのフィルタバンク計算時におけるバンド制限を有効化する.この オプションではカットオフ周波数の下限値を指定する. \-1 を指定することで無効化できる.(default: \-1) +.sp +このオプションは +HTK +の +LOFREQ +に対応する.同じ値が指定できる. +.RE +.PP +\fB \-zmeanframe \fR, \fB \-nozmeanframe \fR +.RS 3n +窓単位の直流成分除去を有効化/無効化する. (default: disabled) +.sp +このオプションは +HTK +の +ZMEANSOURCE +に対応する.\fB\-zmean\fR +も参照のこと. +.RE +.PP +\fB \-usepower \fR +.RS 3n +フィルタバンク解析で振幅の代わりにパワーを使う.(default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB正規化処理\fR +.RS +.PP +\fB \-cvn \fR +.RS 3n +ケプストラム分散正規化 (cepstral variance normalization; CVN) を有効にする.ファイル入力では,入力全体の分散に基づいて正規化 が行われる.直接入力ではあらかじめ分散が得られないため,最後の 入力の分散で代用される.音声信号入力でのみ有効である. 
+.RE +.PP +\fB \-vtln \fR \fIalpha\fR \fIlowcut\fR \fIhicut\fR +.RS 3n +周波数ワーピングを行う.声道長正規化 (vocal tract length normalization; VTLN) に使用できる.引数はそれぞれワーピング 係数,周波数上端,周波数下端であり,HTK設定の +WARPFREQ,WARPHCUTOFF +および +WARPLCUTOFF +に対応する. +.RE +.PP +\fB \-cmnload \fR \fIfile\fR +.RS 3n +起動時にケプストラム平均ベクトルを +\fIfile\fRから読み込む.ファイルは +\fB\-cmnsave\fR +で保存されたファイルを指定する.これ は MAP\-CMN において,起動後最初の発話においてケプストラム平均 の初期値として用いられる.通常,2発話目以降は初期値は,直前の 入力の平均に更新されるが,\fB\-cmnnoupdate\fRを指定 された場合,常にこのファイルの値が各発話の初期値として用いられ る. +.RE +.PP +\fB \-cmnsave \fR \fIfile\fR +.RS 3n +認識中に計算したケプストラム平均ベクトルを +\fIfile\fRへ保存する.すでにファイルがあ る場合は上書きされる.この保存は音声入力が行われるたびに上書きで 行われる. +.RE +.PP +\fB \-cmnupdate \fR \fB \-cmnnoupdate \fR +.RS 3n +実時間認識時,初期ケプストラム平均を入力ごとに更新するかどうか を指定する.通常は有効 (\fB\-cmnupdate\fR) であり, 過去5秒間の入力の平均を初期値として更新する. +\fB\-cmnnoupdate\fR +が指定された場合,更新は行われず, 初期値は起動時の値に固定される.\fB\-cmnload\fR +で初期値 を指定することで,常に同じ初期値を使うようにすることができる. +.RE +.PP +\fB \-cmnmapweight \fR \fIfloat\fR +.RS 3n +MAP\-CMN の初期ケプストラム平均への重みを指定する.値が大きいほ ど初期値に長時間依存し,小さいほど早く現入力のケプストラム平均 を用いるようになる.(default: 100.0) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBフロントエンド処理\fR +.RS +.PP +\fB \-sscalc \fR +.RS 3n +入力先頭の無音部を用いて,入力全体に対してスペクトルサブトラク ションを行う.先頭部の長さは\fB\-sscalclen\fRで指定する. ファイル入力に対してのみ有効である.\fB\-ssload\fR +と 同時に指定できない. +.RE +.PP +\fB \-sscalclen \fR \fImsec\fR +.RS 3n + +\fB\-sscalc\fRオプション指定時,各ファイルにおいて ノイズスペクトルの推定に用いる長さをミリ秒で指定する.(default: 300) +.RE +.PP +\fB \-ssload \fR \fIfile\fR +.RS 3n +ノイズスペクトルを\fIfile\fRから読み込ん でスペクトルサブトラクションを行う. +\fIfile\fRはあらかじめ +mkssで作成する.マイク入力・ネットワーク入 力などのオンライン入力でも適用できる.\fB\-sscalc\fRと 同時に指定できない. +.RE +.PP +\fB \-ssalpha \fR \fIfloat\fR +.RS 3n + +\fB\-sscalc\fRおよび\fB\-ssload\fR用の 減算係数を指定する.この値が大きいほど強くスペクトル減算を行うが, 減算後の信号の歪も大きくなる.(default: 2.0) +.RE +.PP +\fB \-ssfloor \fR \fIfloat\fR +.RS 3n +スペクトルサブトラクションのフロアリング係数を指定する.スペク トル減算時,計算の結果パワースペクトルが負となってしまう帯域に 対しては,原信号にこの係数を乗じたスペクトルが割り当てられる. 
(default: 0.5) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBその他の音響モデル関連オプション\fR +.RS +.PP +\fB \-htkconf \fR \fIfile\fR +.RS 3n + +HTK +Config ファイルを解析して,対応する特徴量抽出オプションを Julius に自動設定する.\fIfile\fR +は +HTK +で音響モデル学習時に使用した Config ファイルを指定する.なお, Julius と +HTK +ではパラメータのデフォルト値が一部異なるが, このオプションを使用する場合,デフォルト値も +HTK +のデフォルト に切替えられる. +.RE +.RE +.SS "認識処理・探索 (\fB\-SR\fR)" +.PP +認識処理・探索オプションは,第1パス・第2パス用のビーム幅や言語重みのパラメータ,ショートポーズセグメンテーションの設定,単語ラティス・CN 出力用設定,forced alignment の指定,その他の認識処理と結果出力に関するパラメータを含む. +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB第1パスパラメータ\fR +.RS +.PP +\fB \-lmp \fR \fIweight\fR \fIpenalty\fR +.RS 3n +(N\-gram使用時) 第1パス用の言語スコア重みおよび挿入ペナルティ. ペナルティは負であれば単語挿入を抑制し,正であれば単語挿入を促 進する. +.RE +.PP +\fB \-penalty1 \fR \fIpenalty\fR +.RS 3n +(文法使用時) 第1パス用の単語挿入ペナルティ. (default: 0.0) +.RE +.PP +\fB \-b \fR \fIwidth\fR +.RS 3n +第1パス探索の枝刈り (rank pruning) のビーム幅を指定する.単位 は HMM ノード数である. デフォルト値は音響モデルやエンジンの設定による.モノフォン 使用時は400, トライフォン使用時は800,トライフォンでかつ setup=v2.1 のときは 1000 となる. +.RE +.PP +\fB \-nlimit \fR \fInum\fR +.RS 3n +第1パスでノードごとに保持する仮説トークンの最大数.通常は 1 で 固定されており変更できない.コンパイル時に +configureで +\-\-enable\-wpairおよび +\-\-enable\-wpair\-nlimit +が指定されているとき のみ変更できる. +.RE +.PP +\fB \-progout \fR +.RS 3n +第1パスで,一定時間おきにその時点での最尤仮説系列を出力する. +.RE +.PP +\fB \-proginterval \fR \fImsec\fR +.RS 3n + +\fB\-progout\fRの出力インターバルをミリ秒で指定する. (default: 300) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB第2パスパラメータ\fR +.RS +.PP +\fB \-lmp2 \fR \fIweight\fR \fIpenalty\fR +.RS 3n +(N\-gram使用時) 第2パス用の言語スコア重みおよび挿入ペナルティ. ペナルティは負であれば単語挿入を抑制し,正であれば単語挿入を促 進する. +.RE +.PP +\fB \-penalty2 \fR \fIpenalty\fR +.RS 3n +(文法使用時) 第2パス用の単語挿入ペナルティ. 
(default: 0.0) +.RE +.PP +\fB \-b2 \fR \fIwidth\fR +.RS 3n +第2パス探索における仮説展開回数の上限を指定する.単位は 仮説数.(default: 30) +.RE +.PP +\fB \-sb \fR \fIfloat\fR +.RS 3n +第2パスの仮説尤度計算時のスコア幅を指定する.単位は対数尤度差 である.(default: 80.0) +.RE +.PP +\fB \-s \fR \fInum\fR +.RS 3n +仮説のスタックサイズを指定する.(default: 500) +.RE +.PP +\fB \-n \fR \fInum\fR +.RS 3n + +\fInum\fR個の文仮説数が見付かるまで探索を 行う.得られた仮説はスコアでソートされて出力される (\fB\-output\fRも見よ).デフォルト値はコンパイル時 のエンジン設定によって変わり,fast 版では 1, standard版では10 である. +.RE +.PP +\fB \-output \fR \fInum\fR +.RS 3n +見つかったN\-best候補のうち,結果として出力する文仮説の数を 指定する.\fB\-n\fRも参照のこと.(default: 1) +.RE +.PP +\fB \-m \fR \fIcount\fR +.RS 3n +探索打ち切りのための仮説展開回数のしきい値を指定する. (default: 2000) +.RE +.PP +\fB \-lookuprange \fR \fIframe\fR +.RS 3n +第2パスの単語展開時に,接続しうる次単語候補を見付けるための 終端時刻の許容幅をフレーム数で指定する.値を大きくするほど その周辺の多くの仮説を次単語候補として仮説展開が行われるように なるが,探索が前に進みにくくなることがある.(default: 5) +.RE +.PP +\fB \-looktrellis \fR +.RS 3n +仮説展開を第1パスの結果単語トレリス上に絞る. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBショートポーズセグメンテーション\fR +.RS +.PP +\fB \-spsegment \fR +.RS 3n +ショートポーズセグメンテーションを有効にする. (Rev.4.0) +.RE +.PP +\fB \-spdur \fR \fIframe\fR +.RS 3n +無音区間判定のためのしきい値を指定する.無音単語が一位仮説とな るフレームがこの値以上続いたとき,無音区間として入力が区切られ る.(default: 10) +.RE +.PP +\fB \-pausemodels \fR \fIstring\fR +.RS 3n +「無音単語」を定義するための音響モデルにおける無音モデルの名前 を指定する.コンマで区切って複数の名前を指定できる. このオプションが指定されない場合,文法を用いた認識では +\fB\-spmodel\fR +で指定されるモデルのみを読みとする単 語が無音単語とされる.また,N\-gramではこれに加えて +\fB\-silhead\fR +および +\fB\-siltail\fR +で 指定される単語も無音単語として扱われる.(Rev.4.0) +.RE +.PP +\fB \-spmargin \fR \fIframe\fR +.RS 3n +デコーダベースVADにおいて,アップトリガ時の巻戻し幅をフレーム 数で指定する.(Rev.4.0) +.sp +このオプションはconfigureに +\-\-enable\-decoder\-vadを付けてコンパイルしたとき のみ有効である. +.RE +.PP +\fB \-spdelay \fR \fIframe\fR +.RS 3n +デコーダベースVADにおいて,アップトリガ判定の遅延幅をフレーム 数で指定する.(Rev.4.0) +.sp +このオプションはconfigureに +\-\-enable\-decoder\-vadを付けてコンパイルしたとき のみ有効である. 
+.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB単語ラティス / confusion network 出力\fR +.RS +.PP +\fB \-lattice \fR, \fB \-nolattice \fR +.RS 3n +単語グラフ(ラティス)の出力を有効化/無効化する. +.RE +.PP +\fB \-confnet \fR, \fB \-noconfnet \fR +.RS 3n +Confusion network の出力を有効化/無効化する.confusion network は単語グラフから生成されるため,有効時は同時に +\fB\-lattice\fR +も有効化される.(Rev.4.0) +.RE +.PP +\fB \-graphrange \fR \fIframe\fR +.RS 3n +グラフ生成において近傍の同一単語仮説をマージする.開始フレーム および終了フレームの位置の差がそれぞれ +\fIframe\fR以下の同一単語仮説についてマー ジする.その際,スコアは高いほうのものが残される.値が \-1 の場 合,マージは一切行われない.値を大きくするほどコンパクトなグラ フが生成されるが,スコアの誤差が大きくなる.このオプションは +\fB\-confnet\fRにも影響する.(default: 0) +.RE +.PP +\fB \-graphcut \fR \fIdepth\fR +.RS 3n +生成されたグラフに対して,深さによるカットオフを行う. +\fIdepth\fRは,あるフレームにおいて存在可 能な単語数の上限を指定する.Julius では,第2パスの探索が不安定 な場合,一部分が極端に深いグラフが生成されることが稀にあり,こ のオプションによってそれを抑制することができる.\-1 を指定する ことでこの機能は無効化される.(default: 80) +.RE +.PP +\fB \-graphboundloop \fR \fIcount\fR +.RS 3n +事後的に行われる単語グラフの境界時間調整において,振動による 無限ループを防ぐための打ち切り値を指定する.(default: 20) +.RE +.PP +\fB \-graphsearchdelay \fR, \fB \-nographsearchdelay \fR +.RS 3n +巨大グラフ生成用にアルゴリズムをチューニングする.このオプショ ンが有効時,Julius は第1文仮説が見つかる前のグラフ生成時の仮説 中断を行わないように,グラフ生成アルゴリズムを変更する.これは, ビーム幅や探索範囲を極端に大きくして巨大なワードグラフを生成し ようとするときに,グラフの精度を改善することがある.(default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fB複数文法/複数辞書認識\fR +.RS +.PP +文法や単単語認識において,一つのインスタンスで複数の文法や辞書を用いる 場合に指定できるオプションである. +.PP +\fB \-multigramout \fR, \fB \-nomultigramout \fR +.RS 3n +複数文法あるいは複数辞書を用いて認識を行う場合,通常の Julius は全ての文法/辞書の中から最尤仮説を出力する.このオプションを 指定することで,与えられた個々の文法/辞書ごとに一位仮説を 出力することができる.(default: disabled) +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBForced alignment\fR +.RS +.PP +\fB \-walign \fR +.RS 3n +認識結果を用いて,入力に対する単語単位の forced alignment を行 う.単語の境界フレームと平均音響尤度が出力される. +.RE +.PP +\fB \-palign \fR +.RS 3n +認識結果を用いて,入力に対する音素単位の forced alignment を行 う.音素ごとの境界フレームと平均音響尤度が出力される. 
+.RE +.PP +\fB \-salign \fR +.RS 3n +認識結果を用いて,入力に対するHMMの状態単位の forced alignment を行う.状態ごとの境界フレームと平均音響尤度が出力される. +.RE +.RE +.sp +.it 1 an-trap +.nr an-no-space-flag 1 +.nr an-break-flag 1 +.br +\fBその他\fR +.RS +.PP +\fB \-inactive \fR +.RS 3n +認識処理インスタンスを一時停止状態 (inactive state) で起動する. (Rev.4.0) +.RE +.PP +\fB \-1pass \fR +.RS 3n +第1パスのみを実行する.このオプションを指定した場合,第2パスは 実行されない. +.RE +.PP +\fB \-fallback1pass \fR +.RS 3n +通常,第2パスの探索が失敗したとき,Julius は認識結果無しで終了 する.このオプションを指定することで,そのような第2パスの失敗時に, 第1パスの最尤仮説を最終結果として出力することができる. (これはJulius\-3.xでのデフォルトの振る舞いである) +.RE +.PP +\fB \-no_ccd \fR, \fB \-force_ccd \fR +.RS 3n +音響モデルを音素コンテキスト依存モデルとして扱うかどうかを明示 的に指定する.デフォルトはHMM中のモデル名から自動判断される. +.sp +.RE +.PP +\fB \-cmalpha \fR \fIfloat\fR +.RS 3n +確信度計算のためのスコアのスムージング係数.(default: 0.05) +.RE +.PP +\fB \-iwsp \fR +.RS 3n +(マルチパスモード時のみ有効)単語間にショートポーズモデルを 挟み込んだ認識処理を行う.このオプションを指定すると,辞書上の 全単語の末尾に,スキップ可能なショートポーズモデルが付加される. このショートポーズモデルはコンテキストを考慮せず,また前後の 音素のコンテキストにも表れない.付加するショートポーズモデルは +\fB\-spmodel\fR +で指定できる. +.RE +.PP +\fB \-transp \fR \fIfloat\fR +.RS 3n +透過単語に対する追加の挿入ペナルティを指定する.(default: 0.0) +.RE +.PP +\fB \-demo \fR +.RS 3n + +\fB\-progout \-quiet\fRと同等. +.RE +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(マイク入力で alsa デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "default". +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(マイク入力で oss デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "\fI/dev/dsp\fR". +.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Linux (alsa/oss) および Windows で,マイク入力時の遅延時間をミ リ秒単位で指定する.短い値を設定することで入力遅延を小さくでき るが,CPU の負荷が大きくなり,また環境によってはプロセスやOSの 挙動が不安定になることがある.最適な値はOS やデバイスに大きく 依存する.デフォルト値は動作環境に依存する. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBALSADEV\fR\fR\fB \fR +.RS 3n +(マイク入力で alsa デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "default". +.RE +.PP +\fB \fR\fB\fBAUDIODEV\fR\fR\fB \fR +.RS 3n +(マイク入力で oss デバイス使用時) 録音デバイス名を指定する. 指定がない場合は "\fI/dev/dsp\fR". 
+.RE +.PP +\fB \fR\fB\fBLATENCY_MSEC\fR\fR\fB \fR +.RS 3n +Linux (alsa/oss) および Windows で,マイク入力時の遅延時間をミ リ秒単位で指定する.短い値を設定することで入力遅延を小さくでき るが,CPU の負荷が大きくなり,また環境によってはプロセスやOSの 挙動が不安定になることがある.最適な値はOS やデバイスに大きく 依存する.デフォルト値は動作環境に依存する. +.RE +.SH "EXAMPLES" +.PP +使用例については付属のチュートリアルをご覧下さい. +.SH "SEE ALSO" +.PP +\fBjulian\fR(1), +\fBjcontrol\fR(1), +\fBadinrec\fR(1), +\fBadintool\fR(1), +\fBmkbingram\fR(1), +\fBmkbinhmm\fR(1), +\fBmkgshmm\fR(1), \fBwav2mfcc\fR(1), +\fBmkss\fR(1) +.PP +[1]\&\fIhttp://julius.sourceforge.jp/\fR +.SH "DIAGNOSTICS" +.PP +正常終了した場合,Julius は exit status として 0 を返します.エラーが見付かった場合は異常終了し, exit status として 1 を返します. 入力ファイルが見つからない場合やうまく読み込めなかった場合は,そのファ イルに対する処理をスキップします. +.SH "BUGS" +.PP +使用できるモデルにはサイズやタイプに若干の制限があります.詳しく はパッケージに付属のドキュメントを参照してください. バグ報告・問い合わせ・コメントなどは julius\-info at lists.sourceforge.jp までお願いします. +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "AUTHORS" +.PP +Rev.1.0 (1998/02/20) +.RS 3n +設計:河原達也と李 晃伸 (京都大学) +.sp +実装:李 晃伸 (京都大学) +.RE +.PP +Rev.1.1 (1998/04/14), Rev.1.2 (1998/10/31), Rev.2.0 (1999/02/20), Rev.2.1 (1999/04/20), Rev.2.2 (1999/10/04), Rev.3.0 (2000/02/14), Rev.3.1 (2000/05/11) +.RS 3n +実装:李 晃伸 (京都大学) +.RE +.PP +Rev.3.2 (2001/08/15), Rev.3.3 (2002/09/11), Rev.3.4 (2003/10/01), Rev.3.4.1 (2004/02/25), Rev.3.4.2 (2004/04/30) +.RS 3n +実装:李 晃伸 (奈良先端科学技術大学院大学) +.RE +.PP +Rev.3.5 (2005/11/11), Rev.3.5.1 (2006/03/31), Rev.3.5.2 (2006/07/31), Rev.3.5.3 (2006/12/29), Rev.4.0 (2007/12/19), Rev.4.1 (2008/09) +.RS 3n +実装:李 晃伸 (名古屋工業大学) +.RE +.SH "THANKS TO" +.PP +このプログラムは Rev.3.1 まで,情報処理振興事業協会(IPA)独創的情報技術育 成事業「日本語ディクテーションの基本ソフトウェアの開発」(代表者:鹿野 清宏 奈良先端科学技術大学院大学教授)の援助を受けて行われました. Rev.3.4.2までは「情報処理学会 連続音声認識コンソーシアム」において公開さ れました. +.PP +3.x 時代のマルチプラットフォーム DLL版 は,板野秀樹氏(現名城大学)の手 によって作成・公開されました.また,Windows Microsoft Speech API対応版は 住吉貴志氏(京都大学・当時)の手によるものです.
+.PP +そのほか,上記の協力・貢献してくださった方々,およびさまざまな助言・コ メントをいただく関係者各位に深く感謝いたします. +.SH "REFERENCES" +.TP 3 +1.\ http://julius.sourceforge.jp/ +\%http://julius.sourceforge.jp/en/ Index: julius4/man/ja/mkbingram.1 diff -u /dev/null julius4/man/ja/mkbingram.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkbingram.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,85 @@ +.\" Title: + mkbingram + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINGRAM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkbingram + \- バイナリ N\-gram 変換 +.SH "概要" +.HP 10 +\fBmkbingram\fR [\-nlr\ \fIforward_ngram.arpa\fR] [\-nrl\ \fIbackward_ngram.arpa\fR] [\-d\ \fIold_bingram_file\fR] {output_bingram_file} +.SH "DESCRIPTION" +.PP +mkbingram は,ARPA形式の N\-gram 定義ファイルをJulius用のバイナリN\-gram ファイルに変換するツールです.あらかじめ変換しておくことで,Juliusの起 動を大幅に高速化できます. +.PP +Julius\-4より,N\-gram は前向き,後ろ向き,あるいは両方を指定できるよう になりました.mkbingram でも,どちらか一方だけでバイナリN\-gramを作成するこ とができます.また,両方を指定した場合は,それら2つのN\-gramは一つのバ イナリN\-gramに結合されます. +.PP +前向きN\-gramのみが指定されたとき,mkbingram は 前向きN\-gramだけからバ イナリN\-gramを生成します.このバイナリN\-gramを使うとき,Julius はその 中の 2\-gram を使って第1パスを行い,第2 パ スではその前向き確率から後向 きの確率を,ベイズ則に従って算出しながら認識を行います. +.PP +後向きN\-gramのみが指定されたとき,mkbingramは後ろ向きN\-gramだけからバ イナリN\-gramを生成します.このバイナリN\-gramを使うとき,Julius はその 中の後向き 2\-gram からベイズ則に従って算出しながら第1パスの認識を行い, 第2パスでは後向き N\-gramを使った認識を行います. +.PP +両方が指定されたときは,前向きN\-gram中の2\-gramと後向きN\-gramが統合され たバイナリN\-gramが生成されます.Juliusではその前向き2\-gramで第1パスを 行い,後向きN\-gramで第2パスを行います.なお両 N\-gram は同一のコーパス から同 一の条件(カットオフ値,バックオフ計算方法等)で学習されてあり, 同一の語彙を持っている必要があります. +.PP +なお,mkbingram は gzip 圧縮された ARPA ファイルもそのまま読み込めます. +.PP +バージョン 3.x 以前で作成したバイナリN\-gramは,そのまま 4.0 でも読めま す.mkbingram に +\fB\-d\fR +で与えることで,古いバイナリ形式 を新しいバイナリ形式に変換することもできます.なお,4.0 以降の mkbingram で作成したバイナリN\-gramファイルは3.x 以前のバージョンでは 使えませんのでご注意ください. 
+.SH "OPTIONS" +.PP +\fB \-nlr \fR \fIforward_ngram.arpa\fR +.RS 3n +前向き(left\-to\-right)のARPA形式 N\-gram ファイルを読み込む +.RE +.PP +\fB \-nrl \fR \fIbackward_ngram.arpa\fR +.RS 3n +後ろ向き(right\-to\-left)のARPA形式 N\-gram ファイルを読み込む +.RE +.PP +\fB \-d \fR \fIold_bingram_file\fR +.RS 3n +バイナリN\-gramを読み込む(古いバイナリ形式の変換用) +.RE +.PP +\fIoutput_bingram_file\fR +.RS 3n +出力先のバイナリN\-gramファイル名 +.RE +.SH "EXAMPLES" +.PP +ARPA形式の N\-gram をバイナリ形式に変換する(前向き+後ろ向き): +.sp .RS 3n .nf % \fBmkbingram\fR \-nlr 2gram.arpa \-nrl rev\-Ngram.arpa outfile .fi .RE +ARPA形式の前向き 4\-gram をバイナリ形式に変換する(前向きのみ): +.sp .RS 3n .nf % \fBmkbingram\fR \-nlr 4gram.arpa outfile .fi .RE +古いバイナリN\-gramファイルを現在の形式に変換する: +.sp .RS 3n .nf % \fBmkbingram\fR \-d old_bingram new_bingram .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbinhmm \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/mkbinhmm.1 diff -u /dev/null julius4/man/ja/mkbinhmm.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkbinhmm.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,73 @@ +.\" Title: + mkbinhmm + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINHMM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkbinhmm + \- バイナリ HMM 変換 +.SH "概要" +.HP 9 +\fBmkbinhmm\fR [\-htkconf\ \fIHTKConfigFile\fR] {hmmdefs_file} {binhmm_file} +.SH "DESCRIPTION" +.PP +mkbinhmm は,HTKのアスキー形式のHMM定義ファイルを,Julius用のバイナ リ形式へ変換します.これを使うことで Juliusの起動を高速化することができます. +.PP +この音響モデルの特徴抽出条件を出力ファイルのヘッダに埋め込むことができ ます.埋め込むには,学習時に特徴量抽出に用いた HTK Config ファイルを "\fB\-htkconf\fR" で指定します.ヘッダに抽出条件を埋め込むことで, 認識時に自動的に必要な特徴抽出パラメータがセットされるので,便利です. 
+.PP +入力として,HTKアスキー形式のほかに,既に変換済みのJulius用バイナリHMM を与えることもできます.\fB\-htkconf\fR +と併用すれば, 既存のバイナリHMMに特徴量抽出条件パラメータを埋め込むことができます. +.PP +mkbinhmm は gzip 圧縮されたHMM定義ファイルをそのまま読み込めます. +.SH "OPTIONS" +.PP +\fB \-htkconf \fR \fIHTKConfigFile\fR +.RS 3n +学習時に特徴量抽出に使用したHTK Configファイルを指定する.指定さ れた場合,その中の設定値が出力ファイルのヘッダに埋め込まれる. 入力に既にヘッダがある場合上書きされる. +.RE +.PP +\fIhmmdefs_file\fR +.RS 3n +変換元の音響モデル定義ファイル (MMF).HTK ASCII 形式,あるいは Julius バイナリ形式. +.RE +.PP +\fIbinhmm_file\fR +.RS 3n +Julius用バイナリ形式ファイルの出力先. +.RE +.SH "EXAMPLES" +.PP +HTK ASCII 形式の HMM 定義をバイナリ形式に変換する: +.sp .RS 3n .nf % \fBmkbinhmm\fR hmmdefs.ascii binhmm .fi .RE +HTKの設定ファイル Config の内容をヘッダに書き込んで出力: +.sp .RS 3n .nf % \fBmkbinhmm\fR \-htkconf Config hmmdefs.ascii binhmm .fi .RE +古いバイナリ形式ファイルにヘッダ情報だけ追加する: +.sp .RS 3n .nf % \fBmkbinhmm\fR \-htkconf Config old_binhmm new_binhmm .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbingram \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/mkbinhmmlist.1 diff -u /dev/null julius4/man/ja/mkbinhmmlist.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkbinhmmlist.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,73 @@ +.\" Title: + mkbinhmmlist + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKBINHMMLIST" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkbinhmmlist + \- HMMList ファイルをバイナリ形式に変換 +.SH "概要" +.HP 13 +\fBmkbinhmmlist\fR {hmmdefs_file} {HMMList_file} {output_binhmmlist_file} +.SH "DESCRIPTION" +.PP +mkbinhmmlist は,主にトライフォンとともに使用される HMMList ファイルを バイナリ形式に変換します.通常のテキスト形式の代わりにこれを使うことで Juliusの起動を高速化することができます.
+.PP +変換には,HMMList ファイルのほかに,一緒に使う音響モデル定義ファイル +\fIhmmdefs_file\fR +が必要です(HTK ASCII形式 / Juliusバイナリ形式のどちらも可). +.PP +Julius で使用する際には,通常のテキスト形式と同じく "\fB\-hlist\fR" オプションで指定します. テキスト形式かバイナリ形式かの判定は Julius 側で自動的に行われます. +.PP +mkbinhmmlist は gzip 圧縮されたファイルをそのまま読み込めます. +.SH "OPTIONS" +.PP +\fIhmmdefs_file\fR +.RS 3n +音響モデル定義ファイル.HTK ASCII 形式,あるいはJulius バイナ リ形式. +.RE +.PP +\fIHMMList_file\fR +.RS 3n +変換対象の HMMList ファイル. +.RE +.PP +\fIoutput_binhmmlist_file\fR +.RS 3n +出力先となるJulius用バイナリ形式HMMListファイル.すでに ある場合は上書きされる. +.RE +.SH "EXAMPLES" +.PP +HMMList ファイル +\fIlogicalTri\fRをバイナリ形式に変換して +\fIlogicalTri.bin\fR +に保存する: +.sp .RS 3n .nf % \fBmkbinhmmlist\fR binhmm logicalTri logicalTri.bin .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB mkbinhmm \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/mkdfa.pl.1 diff -u /dev/null julius4/man/ja/mkdfa.pl.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkdfa.pl.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,95 @@ +.\" Title: + mkdfa.pl + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKDFA.PL" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkdfa.pl + \- Julius 形式の文法をオートマトンに変換するコンパイラ +.SH "概要" +.HP 9 +\fBmkdfa.pl\fR [\fIoptions\fR...] {prefix} +.SH "DESCRIPTION" +.PP +mkdfa.pl は Julius の文法コンパイラです.記述された文法ファイル (.grammar) と語彙ファイル (.voca) から,Julius用の有限状態オートマトン ファイル (.dfa) および認識辞書 (.dict) を生成します.カテゴリ名と生成 後の各ファイルで用いられるカテゴリ ID 番号との対応が .term ファイルと して出力されます. +.PP +各ファイル形式の詳細については,別途ドキュメントをご覧下さい. +.PP + +prefix +は,.grammar ファイルおよび .vocaファイルの プレフィックスを引数として与えます.prefix.grammarと +prefix.vocaからprefix.dfa, +prefix.dictおよび +prefix.termが生成されます. 
+.PP +バージョン 3.5.3 以降の Julius に付属の +\fBmkdfa.pl\fR +は, +\fBdfa_minimize\fR +を内部で自動的に呼び出すので, 出力される .dfa は常に最小化されています. +.SH "OPTIONS" +.PP +\fB \-n \fR +.RS 3n +辞書を出力しない..voca 無しで .grammar のみを .dfa に変換する ことができる. +.RE +.SH "ENVIRONMENT VARIABLES" +.PP +\fB \fR\fB\fBTMP\fR\fR\fB または \fR\fB\fBTEMP\fR\fR\fB \fR +.RS 3n +変換中に一時ファイルを置くディレクトリを指定する. 指定が無い場合, +\fI/tmp\fR, +\fI/var/tmp\fR, +\fI/WINDOWS/Temp\fR, +\fI/WINNT/Temp\fR +の順で最初に見つかった場所が使用される. +.RE +.SH "EXAMPLES" +.PP +文法ファイル +\fIfoo.grammar\fR, +\fIfoo.voca\fRに 対して以下を実行することで +\fIfoo.dfa\fRと +\fIfoo.dict\fRおよび\fIfoo.term\fRが出力される. +.sp .RS 3n .nf % \fBmkdfa.pl\fR foo .fi .RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB nextword \fR( 1 ) +, +\fB accept_check \fR( 1 ) +, +\fB dfa_minimize \fR( 1 ) +.SH "DIAGNOSTICS" +.PP +mkdfa.pl は内部で +\fBmkfa\fR +および +\fBdfa_minimize\fR +を呼び出します.実行時,これらの実行ファ イルが,この mkdfa.pl と同じディレクトリに置いてある必要があります. これらはJulius に同梱されています. +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/mkgshmm.1 diff -u /dev/null julius4/man/ja/mkgshmm.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkgshmm.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,53 @@ +.\" Title: + mkgshmm + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKGSHMM" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkgshmm + \- モノフォンHMMを GMS 用に変換する +.SH "概要" +.HP 8 +\fBmkgshmm\fR {monophone_hmmdefs} + > + {outputfile} +.SH "DESCRIPTION" +.PP +mkgshmm はHTK形式のmonophone HMMを Julius の Gaussian Mixture Selection (GMS) 用に変換するperlスクリプトです. +.PP +GMSはJulius\-3.2からサポートされている音響尤度計算の高速化手法です.
フレームごとに monophone の状態尤度に基づいてtriphoneやPTMの状態を予 備選択することで,音響尤度計算が高速化されます. +.SH "EXAMPLES" +.PP +まずターゲットとするtriphoneやPTMに対して,同じコーパスで学習した monophone モデルを用意します. +.PP +次にそのmonophoneモデルを mkgshmm を用いて GMS 用に変換します. +.sp .RS 3n .nf % \fBmkgshmm\fR monophone > gshmmfile .fi .RE +これを Julius で "\fB\-gshmm\fR" で指定します. +.sp .RS 3n .nf % \fBjulius\fR \-C ... \-gshmm gshmmfile .fi .RE +GMS用モデルはtriphoneやPTMと同一のコーパスから作成する必要がある点に注 意してください.gshmm がミスマッチだと選択誤りが生じ,性能が劣化します. +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/mkss.1 diff -u /dev/null julius4/man/ja/mkss.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/mkss.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,63 @@ +.\" Title: + mkss + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "MKSS" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + mkss + \- スペクトルサブトラクション用のノイズスペクトル計算 +.SH "概要" +.HP 5 +\fBmkss\fR [\fIoptions\fR...] {filename} +.SH "DESCRIPTION" +.PP +mkss は,スペクトルサブトラクション用のノイズスペクトル計算ツールです. 指定時間分の音声のない雑音音声をマイク入力から録音し, その短時間スペクトラムの平均を ファイルに出力します.出力されたファイルは,Julius でスペクトル サブトラクションのためのノイズスペクトルファイル(オプション "\fB\-ssload\fR")として使用できます. +.PP +録音は起動と同時に開始します.サンプリング条件は16bit signed short (big endian), monoral で固定です.既に同じ名前のファイルが存在する場合 は上書きします.また,ファイル名に "\-" を指定するこ とで標準出力へ出力できます. +.SH "OPTIONS" +.PP +\fB \-freq \fR \fIHz\fR +.RS 3n +音声のサンプリング周波数 (Hz) を指定する.(default: 16,000) +.RE +.PP +\fB \-len \fR \fImsec\fR +.RS 3n +録音する時間長をミリ秒単位で指定する(default: 3000) +.RE +.PP +\fB \-fsize \fR \fIsample_num\fR +.RS 3n +窓サイズをサンプル数で指定 (default: 400). +.RE +.PP +\fB \-fshift \fR \fIsample_num\fR +.RS 3n +フレームシフト幅をサンプル数で指定 (default: 160). 
+.RE +.SH "SEE ALSO" +.PP + +\fB julius \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. Index: julius4/man/ja/nextword.1 diff -u /dev/null julius4/man/ja/nextword.1:1.1 --- /dev/null Thu Oct 2 17:23:48 2008 +++ julius4/man/ja/nextword.1 Thu Oct 2 17:23:48 2008 @@ -0,0 +1,104 @@ +.\" Title: + nextword + +.\" Author: +.\" Generator: DocBook XSL Stylesheets v1.71.0 +.\" Date: 10/02/2008 +.\" Manual: +.\" Source: +.\" +.TH "NEXTWORD" "1" "10/02/2008" "" "" +.\" disable hyphenation +.nh +.\" disable justification (adjust text to left margin only) +.ad l +.SH "名前" + + nextword + \- DFA 文法で(逆向きに)次単語を予測するツール +.SH "概要" +.HP 9 +\fBnextword\fR [\-t] [\-r] [\-s\ \fIspname\fR] [\-v] {prefix} +.SH "DESCRIPTION" +.PP +nextword は,\fBmkdfa.pl\fR +によって変換された DFA 文法 上で,与えられた部分文に対して接続しうる次単語の集合を出力します. +.PP +実行には .dfa, .dict, .term の各ファイルが必要です. あらかじめ +\fBmkdfa.pl\fR +で生成しておいて下さい. +.PP +!注意! +\fBmkdfa.pl\fR +で出力される文法は,元の 文法と異なり,文の後ろから前に向かう逆向きの文法となっています. これは,Julius の第2パスで後ろ向きの探索を行うためです. このため,nextword で与える部分文も逆向きとなります. +.SH "OPTIONS" +.PP +\fB \-t \fR +.RS 3n +単語ではなくカテゴリ名で入力・出力する. +.RE +.PP +\fB \-r \fR +.RS 3n +単語を逆順に入力する. +.RE +.PP +\fB \-s \fR \fIspname\fR +.RS 3n +スキップすべきショートポーズ単語の名前を指定する. (default: "sp") +.RE +.PP +\fB \-v \fR +.RS 3n +デバッグ出力. +.RE +.SH "EXAMPLES" +.PP +vfr (フィッティングタスク用文法) での実行例: +.sp +.RS 3n +.nf +% nextword vfr +Reading in dictionary...done +Reading in DFA grammar...done +Mapping dict item <\-> DFA terminal (category)...done +Reading in term file (optional)...done +42 categories, 99 words +DFA has 135 nodes and 198 arcs +\-\-\-\-\- +wseq > に して 下さい silE +[wseq: に して 下さい silE] +[cate: (NI|NI_AT) SURU_V KUDASAI_V NS_E] +PREDICTED CATEGORIES/WORDS: + KEIDOU_A (派手 地味 ) + BANGOU_N (番 ) + HUKU_N (服 服装 服装 ) + PATTERN_N (チェック 縦縞 横縞 ...) 
+ GARA_N (柄 ) + KANZI_N (感じ ) + IRO_N (色 ) + COLOR_N (赤 橙 黄 ...) +wseq > +.fi +.RE +.sp +.SH "SEE ALSO" +.PP + +\fB mkdfa.pl \fR( 1 ) +, +\fB generate \fR( 1 ) +, +\fB accept_check \fR( 1 ) +.SH "COPYRIGHT" +.PP +Copyright (c) 1991\-2008 京都大学 河原研究室 +.PP +Copyright (c) 1997\-2000 情報処理振興事業協会(IPA) +.PP +Copyright (c) 2000\-2008 奈良先端科学技術大学院大学 鹿野研究室 +.PP +Copyright (c) 2005\-2008 名古屋工業大学 Julius開発チーム +.SH "LICENSE" +.PP +Julius の使用許諾に準じます. From sumomo @ users.sourceforge.jp Fri Oct 3 00:00:37 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 00:00:37 +0900 Subject: [Julius-cvs 313] CVS update: julius4 Message-ID: <1222959637.529507.2350.nullmailer@users.sourceforge.jp> Index: julius4/00readme-ja.txt diff -u julius4/00readme-ja.txt:1.5 julius4/00readme-ja.txt:1.6 --- julius4/00readme-ja.txt:1.5 Sun Sep 28 00:33:44 2008 +++ julius4/00readme-ja.txt Fri Oct 3 00:00:37 2008 @@ -4,7 +4,7 @@ Julius - (Rev 4.1 2008/09/xx) + (Rev 4.1 2008/10/03) (Rev 4.0.2 2008/05/27) (Rev 4.0 2007/12/19) (Rev 3.5.3 2006/12/29) @@ -33,7 +33,7 @@ Julius-4.1 -============= +=========== 4.0 ?? 4.0.2 ?????????????C??????????? ???????????????? "-fallback1pass" ? "-usepower" ? @@ -45,14 +45,25 @@ ???????????????? perl ????? "jclient-perl" ? ???????? -??? 4.1 ???????????????????????????タ? -???????????タ??????????????? -?????? "plugin" ???????????????????????? -?????????????????????????????? -????????????R?????????????C?????????? +4.1 ????????????????????????????????? +???????????????????????タ??????????? +??????????????????????????????????? +?????? "plugin" ???????????????????????? +???????????????????????????????????+????????????????? + +???Julius ???????????? "The Juliusbook" ??????? +???????????????????????? Docbook XML ??????+??html ?? pdf ?????????????????????????? +???????????????????????? 4.1 ???????? +????????????????????????Julius???????? +????????????????? + +Juliusbook ???????????????????? ??????_????????Release-ja.txt ??????? + ??????? 
=============== @@ -75,6 +86,7 @@ mkss/ ????????????c?? mkss jclient-perl/ A simple perl version of module mode client plugin/ ?????????????????????+ man/ ?????? support/ ???????? Index: julius4/00readme.txt diff -u julius4/00readme.txt:1.5 julius4/00readme.txt:1.6 --- julius4/00readme.txt:1.5 Sun Sep 28 00:33:44 2008 +++ julius4/00readme.txt Fri Oct 3 00:00:37 2008 @@ -4,7 +4,7 @@ Julius - (Rev 4.1 2008/09/xx) + (Rev 4.1 2008/10/03) (Rev 4.0.2 2008/05/27) (Rev 4.0 2007/12/19) (Rev 3.5.3 2006/12/29) @@ -22,17 +22,22 @@ About Julius ============= -"Julius" is a high-performance, two-pass large vocabulary continuous -speech recognition (LVCSR) decoder software for speech-related -researches and developments. It supports N-gram based dictataion (N -unlimited) , DFA grammar based parsing, and one-pass isolated word -recognition. Phone context dependencies are supported up to triphone. -It can perform a multi-model decoding, a recognition using several LMs -and AMs simultaneously with a single processor, and also support for -"hot plugging" of arbitrary modules at run time. The core engine is -implemented as a C library along with a simple API, which can be -easily integrated into various applications. Standard model formats -for famous tools such as HTK, CMU-Cam SLM toolkit, etc. are adopted. +"Julius" is an open-source high-performance large vocabulary +continuous speech recognition (LVCSR) decoder software for +speech-related researchers and developers. Based on word N-gram and +triphone context-dependent HMM, it can perform almost real-time +decoding on most current PCs with small amount of memory. + +It also has high vesatility. The acoustic models and language models +are pluggable, and you can build various types of speech recognition +system by building your own models and modules to be suitable for your +task. It also adopts standard formats to cope with other toolkit such +as HTK, CMU-Cam SLM toolkit, etc. 
+ +The core engine is implemented as an embeddable library, aiming to offer +speech recognition capability to various applications. The recent +version supports plug-in capability so that the engine can be extended +by the user. The main platform is Linux and other Unix workstations, and also works on Windows (SAPI/console). Julius is distributed with open license @@ -40,7 +45,7 @@ What's new in Julius-4.1 -=========================== +========================== From 4.0 to 4.0.2, many bugs are fixed and small improvements were done. New options "-fallback1pass" and "-usepower" were added. The @@ -50,15 +55,23 @@ for VTLN are all supported. "jclient-perl", a perl version of module mode client, is newly added. -A great forward-steps have been made by implementing a plugin -capability. It enables run-time, easy extension of decoder. -The directory "plugin" contains several example source codes and -ready to compile and test them. The source codes also contain all -function specification documents. +Plug-in support is newly implemented on rev. 4.1. Using dynamic +object linking, Julius now can load extensions at run time, and extend +its ability easily without modifying the original engine source code. +The directory "plugin" contains several example source codes and ready +to compile and test them. The source codes also contain all function +specification documents. + +From this release, you can get the total documentation of Julius +called "Juliusbook". It is written in Docbook XML, and PDF version +and HTML version are available. At this time the English version has only +the option descriptions and online manuals. The full version that +explains all aspects and specification of Julius (models, input, +decoding, etc...) will be released within a short term.
Contents of Julius-4.1 -========================= +======================== (Documents with suffix "ja" are written in Japanese) @@ -82,6 +95,7 @@ support/ some tools to compile julius/julian from source jclient-perl/ A simple perl version of module mode client plugin/ Several plugin source codes and documentation + man/ Unix online manuals olddoc/ ChangeLogs before 3.2 Index: julius4/Release-ja.txt diff -u julius4/Release-ja.txt:1.5 julius4/Release-ja.txt:1.6 --- julius4/Release-ja.txt:1.5 Sun Sep 28 00:33:44 2008 +++ julius4/Release-ja.txt Fri Oct 3 00:00:37 2008 @@ -36,6 +36,11 @@ - HMM ???????HMM?????? 256, ???????P? - ??????????????????????? +??????? + - "Juliusbook" ????? (pdf / html) + - ??????????man ???????????D + ?????????????????????? + 4.0.2 (2008.5.27) ================== Index: julius4/Release.txt diff -u julius4/Release.txt:1.5 julius4/Release.txt:1.6 --- julius4/Release.txt:1.5 Sun Sep 28 00:33:44 2008 +++ julius4/Release.txt Fri Oct 3 00:00:37 2008 @@ -36,6 +36,10 @@ maximum HMM name length = 256 char, Number of HMM states unlimited. - Module mode error message on grammar command. +Documents: + - Alpha version of "Juliusbook" (contains only manuals at this time) + - Unix manuals are moved to "man" directory. 
+ 4.0.2 (2008.5.27) ================== From sumomo @ users.sourceforge.jp Fri Oct 3 00:01:59 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 00:01:59 +0900 Subject: [Julius-cvs 314] CVS update: julius4/libjulius Message-ID: <1222959719.652611.4582.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/Makefile.in diff -u julius4/libjulius/Makefile.in:1.5 julius4/libjulius/Makefile.in:1.6 --- julius4/libjulius/Makefile.in:1.5 Thu Oct 2 17:57:03 2008 +++ julius4/libjulius/Makefile.in Fri Oct 3 00:01:59 2008 @@ -5,7 +5,7 @@ # All rights reserved # -# $Id: Makefile.in,v 1.5 2008/10/02 08:57:03 sumomo Exp $ +# $Id: Makefile.in,v 1.6 2008/10/02 15:01:59 sumomo Exp $ # SHELL=/bin/sh .SUFFIXES: @@ -97,9 +97,9 @@ ${INSTALL} -d ${includedir}/julius ${INSTALL_DATA} include/julius/*.h ${includedir}/julius -install.bin: libjulius-config +install.bin: libjulius-config-dist ${INSTALL} -d ${bindir} - ${INSTALL_PROGRAM} libjulius-config ${bindir} + ${INSTALL_PROGRAM} libjulius-config-dist ${bindir}/libjulius-config depend: makedepend -- $(CFLAGS) -- $(OBJSENT) @@ -117,7 +117,7 @@ $(RM) config.log config.cache $(RM) $(TARGET) $(RM) src/version.c - $(RM) libjulius-config + $(RM) libjulius-config libjulius-config-dist $(RM) doxygen.conf.ver $(RM) config.status include/julius/config.h $(RM) Makefile Index: julius4/libjulius/configure diff -u julius4/libjulius/configure:1.5 julius4/libjulius/configure:1.6 --- julius4/libjulius/configure:1.5 Thu Sep 25 14:00:04 2008 +++ julius4/libjulius/configure Fri Oct 3 00:01:59 2008 @@ -592,7 +592,7 @@ JULIUS_PRODUCTNAME=JuliusLib -JULIUS_VERSION=4.0.2 +JULIUS_VERSION=4.1 # Check whether --enable-pthread or --disable-pthread was given. 
@@ -1926,7 +1926,7 @@ ac_given_srcdir=$srcdir ac_given_INSTALL="$INSTALL" -trap 'rm -fr `echo "Makefile libjulius-config src/version.c doxygen.conf.ver include/julius/config.h" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 +trap 'rm -fr `echo "Makefile libjulius-config libjulius-config-dist src/version.c doxygen.conf.ver include/julius/config.h" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 EOF cat >> $CONFIG_STATUS <> $CONFIG_STATUS <> $CONFIG_STATUS <<\EOF for ac_file in .. $CONFIG_FILES; do if test "x$ac_file" != x..; then @@ -2187,7 +2187,7 @@ EOF cat >> $CONFIG_STATUS <<\EOF -chmod +x libjulius-config +chmod +x libjulius-config libjulius-config-dist exit 0 Index: julius4/libjulius/configure.in diff -u julius4/libjulius/configure.in:1.5 julius4/libjulius/configure.in:1.6 --- julius4/libjulius/configure.in:1.5 Thu Sep 25 14:00:04 2008 +++ julius4/libjulius/configure.in Fri Oct 3 00:01:59 2008 @@ -4,7 +4,7 @@ dnl Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology dnl All rights reserved dnl -dnl $Id: configure.in,v 1.5 2008/09/25 05:00:04 sumomo Exp $ +dnl $Id: configure.in,v 1.6 2008/10/02 15:01:59 sumomo Exp $ dnl AC_INIT(src/search_bestfirst_main.c) @@ -12,7 +12,7 @@ AC_CONFIG_AUX_DIR(../support) JULIUS_PRODUCTNAME=JuliusLib -JULIUS_VERSION=4.0.2 +JULIUS_VERSION=4.1 dnl Checks for options @@ -385,6 +385,6 @@ AC_SUBST(easy_setup) AC_OUTPUT_COMMANDS( -[chmod +x libjulius-config +[chmod +x libjulius-config libjulius-config-dist ]) -AC_OUTPUT(Makefile libjulius-config src/version.c doxygen.conf.ver) +AC_OUTPUT(Makefile libjulius-config libjulius-config-dist src/version.c doxygen.conf.ver) Index: julius4/libjulius/libjulius-config-dist.in diff -u /dev/null julius4/libjulius/libjulius-config-dist.in:1.1 --- /dev/null Fri Oct 3 00:01:59 2008 +++ julius4/libjulius/libjulius-config-dist.in Fri Oct 3 00:01:59 2008 @@ -0,0 +1,61 @@ +#!/bin/sh +# +# libsent configuration result reporter +# +# "libsent-config --cflags" generates C defines, and +# 
"libsent-config --libs" generates libraries needed for compile with +# the sentlib +# +# by Doshita Lab. Speech Group, Kyoto University 1991-2000 +# by Shikano Lab. Speech Group, NAIST 2002 + +# +# ripped from gtk's gtk-config.in +# +# $Id: libjulius-config-dist.in,v 1.1 2008/10/02 15:01:59 sumomo Exp $ +# + +# +# @configure_input@ +# + +version="\ +Julius/Julian library rev.@JULIUS_VERSION@" +usage="\ +Usage: libjulius-config [--libs] [--cflags] [--info] [--version]" + +prefix="@prefix@" +exec_prefix="@exec_prefix@" + +if test $# -eq 0; then + echo "${usage}" 1>&2 + exit 1 +fi + +while test $# -gt 0; do + case "$1" in + -*=*) optarg=`echo "$1" | sed 's/[-_a-zA-Z0-9]*=//'` ;; + *) optarg= ;; + esac + + case $1 in + --cflags) + echo -I@includedir@ @CPPFLAGS@ + ;; + --libs) + echo -L@libdir@ -ljulius @LDFLAGS@ @LIBS@ + ;; + --version) + echo "${version}" + ;; + *) + echo "${usage}" 1>&2 + exit 1 + ;; + esac + shift +done + +echo + +exit 0 Index: julius4/libjulius/libjulius-config.in diff -u julius4/libjulius/libjulius-config.in:1.3 julius4/libjulius/libjulius-config.in:1.4 --- julius4/libjulius/libjulius-config.in:1.3 Thu Sep 25 13:49:05 2008 +++ julius4/libjulius/libjulius-config.in Fri Oct 3 00:01:59 2008 @@ -12,7 +12,7 @@ # # ripped from gtk's gtk-config.in # -# $Id: libjulius-config.in,v 1.3 2008/09/25 04:49:05 sumomo Exp $ +# $Id: libjulius-config.in,v 1.4 2008/10/02 15:01:59 sumomo Exp $ # # @@ -24,6 +24,9 @@ usage="\ Usage: libjulius-config [--libs] [--cflags] [--info] [--version]" +prefix="@prefix@" +exec_prefix="@exec_prefix@" + if test $# -eq 0; then echo "${usage}" 1>&2 exit 1 From sumomo @ users.sourceforge.jp Fri Oct 3 00:01:59 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 00:01:59 +0900 Subject: [Julius-cvs 315] CVS update: julius4/libsent Message-ID: <1222959719.919402.4598.nullmailer@users.sourceforge.jp> Index: julius4/libsent/Makefile.in diff -u julius4/libsent/Makefile.in:1.7
julius4/libsent/Makefile.in:1.8 --- julius4/libsent/Makefile.in:1.7 Thu Oct 2 17:57:03 2008 +++ julius4/libsent/Makefile.in Fri Oct 3 00:01:59 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.7 2008/10/02 08:57:03 sumomo Exp $ +# $Id: Makefile.in,v 1.8 2008/10/02 15:01:59 sumomo Exp $ # SHELL=/bin/sh @@ -151,9 +151,9 @@ ${INSTALL} -d ${includedir}/sent ${INSTALL_DATA} include/sent/*.h ${includedir}/sent -install.bin: libsent-config +install.bin: libsent-config-dist ${INSTALL} -d ${bindir} - ${INSTALL_PROGRAM} libsent-config ${bindir} + ${INSTALL_PROGRAM} libsent-config-dist ${bindir}/libsent-config clean: $(RM) *~ src/*/*~ src/*/*.o src/*/*/*.o include/sent/*~ @@ -162,7 +162,7 @@ distclean: $(RM) *~ src/*/*~ src/*/*.o src/*/*/*.o include/sent/*~ $(RM) config.log config.cache - $(RM) libsent-config + $(RM) libsent-config libsent-config-dist $(RM) config.status include/sent/config.h $(RM) $(TARGET) $(RM) Makefile Index: julius4/libsent/configure diff -u julius4/libsent/configure:1.9 julius4/libsent/configure:1.10 --- julius4/libsent/configure:1.9 Tue Aug 5 18:49:00 2008 +++ julius4/libsent/configure Fri Oct 3 00:01:59 2008 @@ -561,7 +561,7 @@ ac_configure=$ac_aux_dir/configure # This should be Cygnus configure. -LIBSENT_VERSION=4.0.2 +LIBSENT_VERSION=4.1 # specify mic type # Check whether --with-mictype or --without-mictype was given. @@ -3030,7 +3030,7 @@ ac_given_srcdir=$srcdir ac_given_INSTALL="$INSTALL" -trap 'rm -fr `echo "Makefile libsent-config include/sent/config.h" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 +trap 'rm -fr `echo "Makefile libsent-config libsent-config-dist include/sent/config.h" | sed "s/:[^ ]*//g"` conftest*; exit 1' 1 2 15 EOF cat >> $CONFIG_STATUS <> $CONFIG_STATUS <> $CONFIG_STATUS <<\EOF for ac_file in .. 
$CONFIG_FILES; do if test "x$ac_file" != x..; then @@ -3308,7 +3308,7 @@ EOF cat >> $CONFIG_STATUS <<\EOF -chmod +x libsent-config +chmod +x libsent-config libsent-config-dist ./libsent-config --info Index: julius4/libsent/configure.in diff -u julius4/libsent/configure.in:1.9 julius4/libsent/configure.in:1.10 --- julius4/libsent/configure.in:1.9 Tue Aug 5 18:49:00 2008 +++ julius4/libsent/configure.in Fri Oct 3 00:01:59 2008 @@ -3,7 +3,7 @@ dnl Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology dnl All rights reserved dnl -dnl $Id: configure.in,v 1.9 2008/08/05 09:49:00 sumomo Exp $ +dnl $Id: configure.in,v 1.10 2008/10/02 15:01:59 sumomo Exp $ dnl dnl Process this file with autoconf to produce a configure script. @@ -11,7 +11,7 @@ AC_CONFIG_HEADER(include/sent/config.h) AC_CONFIG_AUX_DIR(../support) -LIBSENT_VERSION=4.0.2 +LIBSENT_VERSION=4.1 dnl Checks for options # specify mic type @@ -501,7 +501,7 @@ AC_SUBST(SOUNDLIB) AC_OUTPUT_COMMANDS( -[chmod +x libsent-config +[chmod +x libsent-config libsent-config-dist ./libsent-config --info ], altype=$altype @@ -511,4 +511,4 @@ wavefile_support="$wavefile_support" gzdesc="$gzdesc" ) -AC_OUTPUT(Makefile libsent-config) +AC_OUTPUT(Makefile libsent-config libsent-config-dist) Index: julius4/libsent/libsent-config-dist.in diff -u /dev/null julius4/libsent/libsent-config-dist.in:1.1 --- /dev/null Fri Oct 3 00:01:59 2008 +++ julius4/libsent/libsent-config-dist.in Fri Oct 3 00:01:59 2008 @@ -0,0 +1,86 @@ +#!/bin/sh +# +# libsent configuration result reporter +# +# "libsent-config --cflags" generates C defines, and +# "libsent-config --libs" generates libraries needed for compile with +# the sentlib +# +# by Doshita Lab. Speech Group, Kyoto University 1991-2000 +# by Shikano Lab. 
Speech Group, NAIST 2002 + +# +# ripped from gtk's gtk-config.in +# +# $Id: libsent-config-dist.in,v 1.1 2008/10/02 15:01:59 sumomo Exp $ +# + +# +# @configure_input@ +# + +sound_inc="@SOUNDINC@" +sound_libs="@SOUNDLIB@ @EXTRALIB@" +version="\ +Julius/Julian libsent library rev.@LIBSENT_VERSION@" +info="\ +**************************************************************** +Julius/Julian libsent library rev.@LIBSENT_VERSION@: + +- Audio I/O + primary mic device API : @altype@ (@aldesc@) + supported audio format : @wavefile_support@ + NetAudio support : @use_netaudio@ +- Language Modeling + class N-gram support : @use_class_ngram@ +- Libraries + file decompression by : @gzdesc@ +- Process management + fork on adinnet input : @use_fork@ + + Note: compilation time flags are now stored in \"libsent-config\". + If you link this library, please add output of + \"libsent-config --cflags\" to CFLAGS and + \"libsent-config --libs\" to LIBS. +****************************************************************" +usage="\ +Usage: libsent-config [--libs] [--cflags] [--info] [--version]" + +prefix="@prefix@" +exec_prefix="@exec_prefix@" + +if test $# -eq 0; then + echo "${usage}" 1>&2 + exit 1 +fi + +while test $# -gt 0; do + case "$1" in + -*=*) optarg=`echo "$1" | sed 's/[-_a-zA-Z0-9]*=//'` ;; + *) optarg= ;; + esac + + case $1 in + --cflags) + echo -I@includedir@ $sound_inc + ;; + --libs) + echo -L@libdir@ -lsent $sound_libs @LIBS@ -lm + ;; + --version) + echo "${version}" + ;; + --info) + echo "${info}" + ;; + *) + echo "${usage}" 1>&2 + exit 1 + ;; + esac + shift +done + +echo + +exit 0 Index: julius4/libsent/libsent-config.in diff -u julius4/libsent/libsent-config.in:1.4 julius4/libsent/libsent-config.in:1.5 --- julius4/libsent/libsent-config.in:1.4 Thu Sep 25 13:49:05 2008 +++ julius4/libsent/libsent-config.in Fri Oct 3 00:01:59 2008 @@ -12,7 +12,7 @@ # # ripped from gtk's gtk-config.in # -# $Id: libsent-config.in,v 1.4 2008/09/25 04:49:05 sumomo Exp $ +# $Id:
libsent-config.in,v 1.5 2008/10/02 15:01:59 sumomo Exp $ # # @@ -46,6 +46,9 @@ usage="\ Usage: libsent-config [--libs] [--cflags] [--info] [--version]" +prefix="@prefix@" +exec_prefix="@exec_prefix@" + if test $# -eq 0; then echo "${usage}" 1>&2 exit 1 From sumomo @ users.sourceforge.jp Fri Oct 3 00:02:00 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 00:02:00 +0900 Subject: [Julius-cvs 316] CVS update: julius4/man Message-ID: <1222959720.110289.4605.nullmailer@users.sourceforge.jp> Index: julius4/man/Makefile.in diff -u julius4/man/Makefile.in:1.1 julius4/man/Makefile.in:1.2 --- julius4/man/Makefile.in:1.1 Thu Oct 2 17:57:03 2008 +++ julius4/man/Makefile.in Fri Oct 3 00:01:59 2008 @@ -3,7 +3,7 @@ # Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology # All rights reserved # -# $Id: Makefile.in,v 1.1 2008/10/02 08:57:03 sumomo Exp $ +# $Id: Makefile.in,v 1.2 2008/10/02 15:01:59 sumomo Exp $ # SHELL=/bin/sh RM=@RM@ -f @@ -13,6 +13,11 @@ ############################################################ +all: + @echo Nothing to build + +install: install.man install.man.ja + install.man: ${INSTALL} -d @mandir@/man1 for f in *.1; do \ @@ -30,7 +35,7 @@ ############################################################ clean: - echo nothing to do + @echo Nothing to do distclean: $(RM) Makefile From sumomo @ users.sourceforge.jp Fri Oct 3 00:02:00 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 00:02:00 +0900 Subject: [Julius-cvs 317] CVS update: julius4/support Message-ID: <1222959720.281690.4612.nullmailer@users.sourceforge.jp> Index: julius4/support/build-all.sh diff -u julius4/support/build-all.sh:1.4 julius4/support/build-all.sh:1.5 --- julius4/support/build-all.sh:1.4 Tue May 27 18:16:40 2008 +++ julius4/support/build-all.sh Fri Oct 3 00:02:00 2008 @@ -6,7 +6,7 @@ # # argument: any configure options except "--enable-setup=..." is allowed. 
# -JULIUS_VERSION=4.0.2 +JULIUS_VERSION=4.1 ###################################################################### From sumomo @ users.sourceforge.jp Fri Oct 3 01:38:40 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 01:38:40 +0900 Subject: [Julius-cvs 318] CVS update: julius4/julius-simple Message-ID: <1222965520.435858.4001.nullmailer@users.sourceforge.jp> Index: julius4/julius-simple/Makefile diff -u julius4/julius-simple/Makefile:1.2 julius4/julius-simple/Makefile:1.3 --- julius4/julius-simple/Makefile:1.2 Thu Sep 25 13:49:05 2008 +++ julius4/julius-simple/Makefile Fri Oct 3 01:38:40 2008 @@ -4,7 +4,16 @@ CC=gcc CFLAGS=-g -O2 -CPPFLAGS=-I. -I$(LIBJULIUS)/include -I$(LIBSENT)/include `$(LIBSENT)/libsent-config --cflags` `$(LIBJULIUS)/libjulius-config --cflags` +#### +#### When using system-installed libraries +#### +# CPPFLAGS=`libjulius-config --cflags` `libsent-config --cflags` +# LDFLAGS=`libjulius-config --libs` `libsent-config --libs` + +#### +#### When using within-package libraries +#### +CPPFLAGS=-I$(LIBJULIUS)/include -I$(LIBSENT)/include `$(LIBSENT)/libsent-config --cflags` `$(LIBJULIUS)/libjulius-config --cflags` LDFLAGS= -L$(LIBJULIUS) `$(LIBJULIUS)/libjulius-config --libs` -L$(LIBSENT) `$(LIBSENT)/libsent-config --libs` ############################################################ From sumomo @ users.sourceforge.jp Fri Oct 3 10:27:11 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 03 Oct 2008 10:27:11 +0900 Subject: [Julius-cvs 319] CVS update: julius4 Message-ID: <1222997231.874774.29003.nullmailer@users.sourceforge.jp> Index: julius4/Release-ja.txt diff -u julius4/Release-ja.txt:1.6 julius4/Release-ja.txt:1.7 --- julius4/Release-ja.txt:1.6 Fri Oct 3 00:00:37 2008 +++ julius4/Release-ja.txt Fri Oct 3 10:27:11 2008 @@ -1,4 +1,4 @@ -4.1 (2008.9.xx) +4.1 (2008.10.3) ================ ?????????????? - ??????????? 
Index: julius4/Release.txt diff -u julius4/Release.txt:1.6 julius4/Release.txt:1.7 --- julius4/Release.txt:1.6 Fri Oct 3 00:00:37 2008 +++ julius4/Release.txt Fri Oct 3 10:27:11 2008 @@ -1,4 +1,4 @@ -4.1 (2008.9.xx) +4.1 (2008.10.3) ================ New plugin extension: - supported types: From sumomo @ users.sourceforge.jp Sat Oct 4 00:07:08 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Sat, 04 Oct 2008 00:07:08 +0900 Subject: [Julius-cvs 320] CVS update: julius4/libsent/src/anlz Message-ID: <1223046428.065826.9785.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/anlz/strip.c diff -u julius4/libsent/src/anlz/strip.c:1.2 julius4/libsent/src/anlz/strip.c:1.3 --- julius4/libsent/src/anlz/strip.c:1.2 Tue Dec 18 17:45:50 2007 +++ julius4/libsent/src/anlz/strip.c Sat Oct 4 00:07:07 2008 @@ -11,7 +11,7 @@ * @author Akinobu LEE * @date Tue Feb 15 00:30:38 2005 * - * $Revision: 1.2 $ + * $Revision: 1.3 $ * */ /* @@ -63,7 +63,7 @@ } } else { /* deleted (leave uncopied) */ - jlog("Warning: strip: sample %d-%d is invalid, stripped\n", bgn, src-1); + jlog("Warning: strip: sample %d-%d has zero value, stripped\n", bgn, src-1); } } a[dst++] = a[src]; From sumomo @ users.sourceforge.jp Sat Oct 4 00:09:28 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Sat, 04 Oct 2008 00:09:28 +0900 Subject: [Julius-cvs 321] CVS update: julius4/libsent/src/wav2mfcc Message-ID: <1223046568.309228.11435.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/wav2mfcc/para.c diff -u julius4/libsent/src/wav2mfcc/para.c:1.6 julius4/libsent/src/wav2mfcc/para.c:1.7 --- julius4/libsent/src/wav2mfcc/para.c:1.6 Tue Jun 17 10:20:51 2008 +++ julius4/libsent/src/wav2mfcc/para.c Sat Oct 4 00:09:28 2008 @@ -16,7 +16,7 @@ * @author Akinobu Lee * @date Fri Oct 27 14:55:00 2006 * - * $Revision: 1.6 $ + * $Revision: 1.7 $ * */ /* @@ -207,6 +207,8 @@ return FALSE; } + srate = 0.0; + while (getl_fp(buf, 512, fp) != NULL) { p = buf; if (*p 
== 35) { /* skip comment line */ @@ -228,7 +230,6 @@ /* process arguments */ skipped = FALSE; - srate = 0.0; if (strmatch(d, "SOURCERATE")) { /* -smpPeriod */ srate = atof(a); } else if (strmatch(d, "TARGETRATE")) { /* -fshift */ From sumomo @ users.sourceforge.jp Tue Oct 7 03:08:54 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Tue, 07 Oct 2008 03:08:54 +0900 Subject: [Julius-cvs 322] CVS update: julius4/libsent/src/ngram Message-ID: <1223316534.751910.12503.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/ngram/ngram_read_arpa.c diff -u julius4/libsent/src/ngram/ngram_read_arpa.c:1.7 julius4/libsent/src/ngram/ngram_read_arpa.c:1.8 --- julius4/libsent/src/ngram/ngram_read_arpa.c:1.7 Thu Mar 20 18:08:04 2008 +++ julius4/libsent/src/ngram/ngram_read_arpa.c Tue Oct 7 03:08:54 2008 @@ -20,7 +20,7 @@ * @author Akinobu LEE * @date Wed Feb 16 16:52:24 2005 * - * $Revision: 1.7 $ + * $Revision: 1.8 $ * */ /* @@ -30,7 +30,7 @@ * All rights reserved */ -/* $Id: ngram_read_arpa.c,v 1.7 2008/03/20 09:08:04 sumomo Exp $ */ +/* $Id: ngram_read_arpa.c,v 1.8 2008/10/06 18:08:54 sumomo Exp $ */ /* words should be alphabetically sorted */ @@ -284,8 +284,8 @@ return FALSE; } w[0] = ngram_lookup_word(ndata, s); - if (w[1] == WORD_INVALID) { - jlog("Error: ngram_read_arpa: 2-gram #%d: \"%s\": \"%s\" not exist in 1-gram\n", n2+1, pbuf, s); + if (w[0] == WORD_INVALID) { + jlog("Error: ngram_read_arpa: 2-gram #%d: \"%s\": \"%s\" not exist in 1-gram\n", bi_count, pbuf, s); ok_p = FALSE; continue; } @@ -294,8 +294,8 @@ return FALSE; } w[1] = ngram_lookup_word(ndata, s); - if (w[0] == WORD_INVALID) { - jlog("Error: ngram_read_arpa: 2-gram #%d: \"%s\": \"%s\" not exist in 1-gram\n", n2+1, pbuf, s); + if (w[1] == WORD_INVALID) { + jlog("Error: ngram_read_arpa: 2-gram #%d: \"%s\": \"%s\" not exist in 1-gram\n", bi_count, pbuf, s); ok_p = FALSE; continue; } From sumomo @ users.sourceforge.jp Tue Oct 7 03:09:27 2008 From: sumomo @ users.sourceforge.jp 
(sumomo @ users.sourceforge.jp) Date: Tue, 07 Oct 2008 03:09:27 +0900 Subject: [Julius-cvs 323] CVS update: julius4/libjulius/src Message-ID: <1223316567.323788.12723.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/src/m_jconf.c diff -u julius4/libjulius/src/m_jconf.c:1.4 julius4/libjulius/src/m_jconf.c:1.5 --- julius4/libjulius/src/m_jconf.c:1.4 Thu Jun 19 01:20:55 2008 +++ julius4/libjulius/src/m_jconf.c Tue Oct 7 03:09:27 2008 @@ -37,7 +37,7 @@ * @author Akinobu Lee * @date Thu May 12 14:16:18 2005 * - * $Revision: 1.4 $ + * $Revision: 1.5 $ * */ /* @@ -127,6 +127,7 @@ } #endif } + prev_c = c; } buf[pos] = '\0'; @@ -411,7 +412,7 @@ dst_from = dst; while (*p != '\0' && (!ISTOKEN(*p))) { - if (0 &&/* '\' is removed by fgets_jconf */ *p == '\\') { /* escape by '\' */ + if (*p == '\\') { /* escape by '\' */ if (*(++p) == '\0') break; *(dst++) = *(p++); } else { From sumomo @ users.sourceforge.jp Tue Oct 7 03:10:05 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Tue, 07 Oct 2008 03:10:05 +0900 Subject: [Julius-cvs 324] CVS update: julius4/libjulius Message-ID: <1223316605.114396.13845.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/configure diff -u julius4/libjulius/configure:1.6 julius4/libjulius/configure:1.7 --- julius4/libjulius/configure:1.6 Fri Oct 3 00:01:59 2008 +++ julius4/libjulius/configure Tue Oct 7 03:10:04 2008 @@ -1733,24 +1733,119 @@ EOF +echo $ac_n "checking for dlopen""... $ac_c" 1>&6 +echo "configure:1738: checking for dlopen" >&5 +if eval "test \"`echo '$''{'ac_cv_func_dlopen'+set}'`\" = set"; then + echo $ac_n "(cached) $ac_c" 1>&6 +else + cat > conftest.$ac_ext < +/* Override any gcc2 internal prototype to avoid an error. */ +/* We use char because int might match the return type of a gcc2 + builtin and then its argument prototype would still apply. */ +char dlopen(); + +int main() { + +/* The GNU C library defines this for functions which it implements + to always fail with ENOSYS. 
Some functions are actually named + something starting with __ and the normal name is an alias. */ +#if defined (__stub_dlopen) || defined (__stub___dlopen) +choke me +#else +dlopen(); +#endif + +; return 0; } +EOF +if { (eval echo configure:1766: \"$ac_link\") 1>&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then + rm -rf conftest* + eval "ac_cv_func_dlopen=yes" +else + echo "configure: failed program was:" >&5 + cat conftest.$ac_ext >&5 + rm -rf conftest* + eval "ac_cv_func_dlopen=no" +fi +rm -f conftest* +fi + +if eval "test \"`echo '$ac_cv_func_'dlopen`\" = yes"; then + echo "$ac_t""yes" 1>&6 + : +else + echo "$ac_t""no" 1>&6 +echo $ac_n "checking for dlopen in -ldl""... $ac_c" 1>&6 +echo "configure:1784: checking for dlopen in -ldl" >&5 +ac_lib_var=`echo dl'_'dlopen | sed 'y%./+-%__p_%'` +if eval "test \"`echo '$''{'ac_cv_lib_$ac_lib_var'+set}'`\" = set"; then + echo $ac_n "(cached) $ac_c" 1>&6 +else + ac_save_LIBS="$LIBS" +LIBS="-ldl $LIBS" +cat > conftest.$ac_ext <&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then + rm -rf conftest* + eval "ac_cv_lib_$ac_lib_var=yes" +else + echo "configure: failed program was:" >&5 + cat conftest.$ac_ext >&5 + rm -rf conftest* + eval "ac_cv_lib_$ac_lib_var=no" +fi +rm -f conftest* +LIBS="$ac_save_LIBS" + +fi +if eval "test \"`echo '$ac_cv_lib_'$ac_lib_var`\" = yes"; then + echo "$ac_t""yes" 1>&6 + ac_tr_lib=HAVE_LIB`echo dl | sed -e 's/^a-zA-Z0-9_/_/g' \ + -e 'y/abcdefghijklmnopqrstuvwxyz/ABCDEFGHIJKLMNOPQRSTUVWXYZ/'` + cat >> confdefs.h <&6 +fi + +fi + if test "$want_pthread" = yes; then case "$host_os" in freebsd*) # FreeBSD echo $ac_n "checking for linking POSIX threaded process""... 
$ac_c" 1>&6 -echo "configure:1743: checking for linking POSIX threaded process" >&5 +echo "configure:1838: checking for linking POSIX threaded process" >&5 ac_save_CFLAGS="$CFLAGS" CFLAGS="$CFLAGS -pthread" cat > conftest.$ac_ext < int main() { pthread_equal(NULL,NULL); ; return 0; } EOF -if { (eval echo configure:1754: \"$ac_link\") 1>&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then +if { (eval echo configure:1849: \"$ac_link\") 1>&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then rm -rf conftest* use_pthread=yes cat >> confdefs.h <<\EOF @@ -1771,18 +1866,18 @@ *) # other with libpthread echo $ac_n "checking for POSIX thread library in -lpthread""... $ac_c" 1>&6 -echo "configure:1775: checking for POSIX thread library in -lpthread" >&5 +echo "configure:1870: checking for POSIX thread library in -lpthread" >&5 ac_save_LIBS_p="$LIBS" LIBS="$LIBS -lpthread" cat > conftest.$ac_ext < int main() { pthread_equal(NULL,NULL); ; return 0; } EOF -if { (eval echo configure:1786: \"$ac_link\") 1>&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then +if { (eval echo configure:1881: \"$ac_link\") 1>&5; (eval $ac_link) 2>&5; } && test -s conftest${ac_exeext}; then rm -rf conftest* use_pthread=yes cat >> confdefs.h <<\EOF Index: julius4/libjulius/configure.in diff -u julius4/libjulius/configure.in:1.6 julius4/libjulius/configure.in:1.7 --- julius4/libjulius/configure.in:1.6 Fri Oct 3 00:01:59 2008 +++ julius4/libjulius/configure.in Tue Oct 7 03:10:04 2008 @@ -4,7 +4,7 @@ dnl Copyright (c) 2005-2007 Julius project team, Nagoya Institute of Technology dnl All rights reserved dnl -dnl $Id: configure.in,v 1.6 2008/10/02 15:01:59 sumomo Exp $ +dnl $Id: configure.in,v 1.7 2008/10/06 18:10:04 sumomo Exp $ dnl AC_INIT(src/search_bestfirst_main.c) @@ -341,6 +341,7 @@ dnl AC_CHECK_FUNCS(strdup strstr) dnl AC_CHECK_FUNC(gethostbyname,,AC_CHECK_LIB(nsl,gethostbyname)) dnl AC_CHECK_FUNC(connect,,AC_CHECK_LIB(socket, connect)) 
+AC_CHECK_FUNC(dlopen,,AC_CHECK_LIB(dl, dlopen)) dnl check for POSIX thread support if test "$want_pthread" = yes; then From sumomo @ users.sourceforge.jp Sun Oct 12 08:11:50 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Sun, 12 Oct 2008 08:11:50 +0900 Subject: [Julius-cvs 325] CVS update: julius4/julius Message-ID: <1223766710.624069.28740.nullmailer@users.sourceforge.jp> Index: julius4/julius/module.c diff -u julius4/julius/module.c:1.6 julius4/julius/module.c:1.7 --- julius4/julius/module.c:1.6 Thu Sep 25 13:56:20 2008 +++ julius4/julius/module.c Sun Oct 12 08:11:50 2008 @@ -88,20 +88,22 @@ * */ static boolean -read_grammar(FILE *fp, DFA_INFO **ret_dfa, WORD_INFO **ret_winfo, HTK_HMM_INFO *hmminfo) +read_grammar(FILE *fp, DFA_INFO **ret_dfa, WORD_INFO **ret_winfo, HTK_HMM_INFO *hmminfo, boolean lmvar) { - DFA_INFO *dfa; + DFA_INFO *dfa = NULL; WORD_INFO *winfo; /* load grammar: dfa and dict in turn */ - dfa = dfa_info_new(); - if (!rddfa_fp(fp, dfa)) { - return FALSE; + if (lmvar != LM_DFA_WORD) { + dfa = dfa_info_new(); + if (!rddfa_fp(fp, dfa)) { + return FALSE; + } } winfo = word_info_new(); /* ignore MONOTREE */ if (!voca_load_htkdict_fp(fp, winfo, hmminfo, FALSE)) { - dfa_info_free(dfa); + if (dfa) dfa_info_free(dfa); return FALSE; } *ret_dfa = dfa; @@ -246,7 +248,7 @@ p = NULL; } /* read a new grammar via socket */ - if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo) == FALSE) { + if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur->lmvar) == FALSE) { module_send(module_sd, "\n.\n"); } else { if (cur->lmtype == LM_DFA) { @@ -280,7 +282,7 @@ p = NULL; } /* read a new grammar via socket */ - if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo) == FALSE) { + if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur->lmvar) == FALSE) { module_send(module_sd, "\n.\n"); } else { if (cur->lmtype == LM_DFA) { Index: julius4/julius/output_module.c diff -u 
julius4/julius/output_module.c:1.2 julius4/julius/output_module.c:1.3 --- julius4/julius/output_module.c:1.2 Tue Dec 18 17:45:48 2007 +++ julius4/julius/output_module.c Sun Oct 12 08:11:50 2008 @@ -12,7 +12,7 @@ * @author Akinobu Lee * @date Tue Sep 06 14:46:49 2005 * - * $Revision: 1.2 $ + * $Revision: 1.3 $ * */ /* @@ -659,10 +659,14 @@ module_send(module_sd, "\n"); for(m=r->lm->grammars;m;m=m->next) { - module_send(module_sd, " #%2d: [%-11s] %4d words, %3d categories, %4d nodes", + module_send(module_sd, " #%2d: [%-11s] %4d words", m->id, m->active ? "active" : "inactive", - m->winfo->num, m->dfa->term_num, m->dfa->state_num); + m->winfo->num); + if (m->dfa) { + module_send(module_sd, ", %3d categories, %4d nodes", + m->dfa->term_num, m->dfa->state_num); + } if (m->newbie) module_send(module_sd, " (new)"); if (m->hook != MULTIGRAM_DEFAULT) { module_send(module_sd, " (next: %s)", hookstr[m->hook]); From sumomo @ users.sourceforge.jp Mon Oct 13 17:43:43 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Mon, 13 Oct 2008 17:43:43 +0900 Subject: [Julius-cvs 326] CVS update: julius4/libjulius/src Message-ID: <1223887423.265240.24410.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/src/m_options.c diff -u julius4/libjulius/src/m_options.c:1.15 julius4/libjulius/src/m_options.c:1.16 --- julius4/libjulius/src/m_options.c:1.15 Thu Sep 25 14:00:06 2008 +++ julius4/libjulius/src/m_options.c Mon Oct 13 17:43:43 2008 @@ -18,7 +18,7 @@ * @author Akinobu Lee * @date Thu May 12 18:52:07 2005 * - * $Revision: 1.15 $ + * $Revision: 1.16 $ * */ /* @@ -283,6 +283,16 @@ if ((lmconf = j_get_lmconf_by_name(jconf, tmparg)) == NULL) return FALSE; } + /* check to avoid assigning an LM for multiple SR */ + for(sconf=jconf->search_root;sconf;sconf=sconf->next) { + if (sconf->lmconf == lmconf) { + jlog("ERROR: you are going to share LM \"%s\" among multiple SRs\n"); + jlog("ERROR: current Julius cannot share LM among SRs\n"); + jlog("ERROR: you should 
define LM for each SR\n"); + return FALSE; + } + } + /* if not first time, create new module instance and switch to it */ sconf = j_jconf_search_new(); sconf->amconf = amconf; From sumomo @ users.sourceforge.jp Thu Oct 16 01:06:33 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Thu, 16 Oct 2008 01:06:33 +0900 Subject: [Julius-cvs 327] CVS update: julius4/libsent/src/ngram Message-ID: <1224086793.921132.16778.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/ngram/ngram_read_arpa.c diff -u julius4/libsent/src/ngram/ngram_read_arpa.c:1.8 julius4/libsent/src/ngram/ngram_read_arpa.c:1.9 --- julius4/libsent/src/ngram/ngram_read_arpa.c:1.8 Tue Oct 7 03:08:54 2008 +++ julius4/libsent/src/ngram/ngram_read_arpa.c Thu Oct 16 01:06:33 2008 @@ -20,7 +20,7 @@ * @author Akinobu LEE * @date Wed Feb 16 16:52:24 2005 * - * $Revision: 1.8 $ + * $Revision: 1.9 $ * */ /* @@ -30,7 +30,7 @@ * All rights reserved */ -/* $Id: ngram_read_arpa.c,v 1.8 2008/10/06 18:08:54 sumomo Exp $ */ +/* $Id: ngram_read_arpa.c,v 1.9 2008/10/15 16:06:33 sumomo Exp $ */ /* words should be alphabetically sorted */ @@ -138,10 +138,10 @@ } name = strcpy((char *)mymalloc(strlen(p)+1), p); if ((p = strtok(NULL, DELM)) == NULL) { - jlog("Error: ngram_read_arpa: LR 1-gram: failed to parse, corrupted or invalid data?\n"); - return FALSE; + bo_wt = 0.0; + } else { + bo_wt = (LOGPROB)atof(p); } - bo_wt = (LOGPROB)atof(p); /* register word entry name */ ndata->wname[nid] = name; @@ -217,10 +217,10 @@ } name = strcpy((char *)mymalloc(strlen(p)+1), p); if ((p = strtok(NULL, DELM)) == NULL) { - jlog("Error: ngram_read_arpa: RL 1-gram: failed to parse, corrupted or invalid data?\n"); - return FALSE; + bo_wt = 0.0; + } else { + bo_wt = (LOGPROB)atof(p); } - bo_wt = (LOGPROB)atof(p); /* add bo_wt_rl to existing 1-gram entry */ nid = ngram_lookup_word(ndata, name); @@ -473,8 +473,11 @@ bowt = (LOGPROB) atof(s); if (t->bo_wt == NULL) { t->bo_wt = (LOGPROB *)mymalloc(sizeof(LOGPROB) * 
t->totalnum); + for(i=0;ibo_wt[nnid] = 0.0; } t->bo_wt[nnid] = bowt; + } else { + if (t->bo_wt != NULL) t->bo_wt[nnid] = 0.0; } /* store the entry info */ From sumomo @ users.sourceforge.jp Fri Oct 17 08:33:23 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 08:33:23 +0900 Subject: [Julius-cvs 328] CVS update: julius4/jcontrol Message-ID: <1224200003.932277.29977.nullmailer@users.sourceforge.jp> Index: julius4/jcontrol/japi.h diff -u julius4/jcontrol/japi.h:1.2 julius4/jcontrol/japi.h:1.3 --- julius4/jcontrol/japi.h:1.2 Tue Dec 18 17:45:48 2007 +++ julius4/jcontrol/japi.h Fri Oct 17 08:33:23 2008 @@ -12,7 +12,7 @@ * @author Akinobu LEE * @date Thu Mar 24 07:12:32 2005 * - * $Revision: 1.2 $ + * $Revision: 1.3 $ * */ /* @@ -92,6 +92,7 @@ void japi_set_input_handler_on_change(int, char *); /* japi_grammar.c */ +void japi_get_graminfo(int sd); void japi_change_grammar(int sd, char *prefixpath); void japi_add_grammar(int sd, char *prefixpath); void japi_delete_grammar(int sd, char *idlist); Index: julius4/jcontrol/japi_grammar.c diff -u julius4/jcontrol/japi_grammar.c:1.2 julius4/jcontrol/japi_grammar.c:1.3 --- julius4/jcontrol/japi_grammar.c:1.2 Tue Dec 18 17:45:48 2007 +++ julius4/jcontrol/japi_grammar.c Fri Oct 17 08:33:23 2008 @@ -12,7 +12,7 @@ * @author Akinobu LEE * @date Thu Mar 24 07:13:41 2005 * - * $Revision: 1.2 $ + * $Revision: 1.3 $ * */ /* @@ -45,13 +45,25 @@ static int check_grammar_path(char *prefix) { - snprintf(buf, MAXLINELEN, "%s.dfa", prefix); - if (access(buf, R_OK) < 0) { - perror("japi_change_grammar"); return -1; - } - snprintf(buf, MAXLINELEN, "%s.dict", prefix); - if (access(buf, R_OK) < 0) { - perror("japi_change_grammar"); return -1; + int i; + + i = strlen(prefix) - 1; + while(prefix[i] != '.' 
&& i >= 0) i--; + if (i < 0 && strcmp(&(prefix[i]), ".dict") != 0) { + snprintf(buf, MAXLINELEN, "%s.dfa", prefix); + if (access(buf, R_OK) < 0) { + fprintf(stderr, "Error: \"%s.dfa\" not exist\n", prefix); + return -1; + } + snprintf(buf, MAXLINELEN, "%s.dict", prefix); + if (access(buf, R_OK) < 0) { + fprintf(stderr, "Error: \"%s.dict\" not exist\n", prefix); + return -1; + } + } else { + if (access(prefix, R_OK) < 0) { + fprintf(stderr, "Error: \"%s\" not exist\n", prefix); + } } return 0; } @@ -78,17 +90,24 @@ send_grammar(int sd, char *prefix) { FILE *fp; - - snprintf(buf, MAXLINELEN, "%s.dfa", prefix); - if ((fp = fopen(buf, "r")) == NULL) { - perror("japi_change_grammar"); return -1; - } - while(fgets(buf, MAXLINELEN, fp) != NULL) { - do_send(sd, buf); + int i; + + i = strlen(prefix) - 1; + while(prefix[i] != '.' && i >= 0) i--; + if (i < 0 && strcmp(&(prefix[i]), ".dict") != 0) { + snprintf(buf, MAXLINELEN, "%s.dfa", prefix); + if ((fp = fopen(buf, "r")) == NULL) { + perror("japi_change_grammar"); return -1; + } + while(fgets(buf, MAXLINELEN, fp) != NULL) { + do_send(sd, buf); + } + do_send(sd, "DFAEND\n"); + fclose(fp); + snprintf(buf, MAXLINELEN, "%s.dict", prefix); + } else { + snprintf(buf, MAXLINELEN, "%s", prefix); } - do_send(sd, "DFAEND\n"); - fclose(fp); - snprintf(buf, MAXLINELEN, "%s.dict", prefix); if ((fp = fopen(buf, "r")) == NULL) { perror("japi_change_grammar"); return -1; } @@ -283,6 +302,12 @@ } void +japi_get_graminfo(int sd) +{ + do_send(sd, "GRAMINFO\n"); +} + +void japi_add_words(int sd, char *idstr, char *dictfile) { FILE *fp; Index: julius4/jcontrol/jcontrol.c diff -u julius4/jcontrol/jcontrol.c:1.3 julius4/jcontrol/jcontrol.c:1.4 --- julius4/jcontrol/jcontrol.c:1.3 Tue May 13 15:32:47 2008 +++ julius4/jcontrol/jcontrol.c Fri Oct 17 08:33:23 2008 @@ -12,7 +12,7 @@ * @author Akinobu LEE * @date Thu Mar 24 11:49:27 2005 * - * $Revision: 1.3 $ + * $Revision: 1.4 $ * */ /* @@ -60,6 +60,8 @@ japi_get_version(sd); } else if (strmatch(com, 
"status")) { japi_get_status(sd); + } else if (strmatch(com, "graminfo")) { + japi_get_graminfo(sd); } else if (strmatch(com, "pause")) { japi_pause_recog(sd); } else if (strmatch(com, "terminate")) { From sumomo @ users.sourceforge.jp Fri Oct 17 08:43:25 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 08:43:25 +0900 Subject: [Julius-cvs 329] CVS update: julius4/julius Message-ID: <1224200605.215071.6631.nullmailer@users.sourceforge.jp> Index: julius4/julius/module.c diff -u julius4/julius/module.c:1.7 julius4/julius/module.c:1.8 --- julius4/julius/module.c:1.7 Sun Oct 12 08:11:50 2008 +++ julius4/julius/module.c Fri Oct 17 08:43:25 2008 @@ -88,23 +88,30 @@ * */ static boolean -read_grammar(FILE *fp, DFA_INFO **ret_dfa, WORD_INFO **ret_winfo, HTK_HMM_INFO *hmminfo, boolean lmvar) +read_grammar(FILE *fp, DFA_INFO **ret_dfa, WORD_INFO **ret_winfo, HTK_HMM_INFO *hmminfo, RecogProcess *r) { DFA_INFO *dfa = NULL; WORD_INFO *winfo; + JCONF_LM *lmconf; /* load grammar: dfa and dict in turn */ - if (lmvar != LM_DFA_WORD) { + if (r->lmvar != LM_DFA_WORD) { dfa = dfa_info_new(); if (!rddfa_fp(fp, dfa)) { return FALSE; } } winfo = word_info_new(); - /* ignore MONOTREE */ - if (!voca_load_htkdict_fp(fp, winfo, hmminfo, FALSE)) { - if (dfa) dfa_info_free(dfa); - return FALSE; + if (r->lmvar == LM_DFA_WORD) { + lmconf = r->lm->config; + if (!voca_load_wordlist_fp(fp, winfo, hmminfo, lmconf->wordrecog_head_silence_model_name, lmconf->wordrecog_tail_silence_model_name, (lmconf->wordrecog_silence_context_name[0] == '\0') ? 
NULL : lmconf->wordrecog_silence_context_name)) { + return FALSE; + } + } else { + if (!voca_load_htkdict_fp(fp, winfo, hmminfo, FALSE)) { + dfa_info_free(dfa); + return FALSE; + } } *ret_dfa = dfa; *ret_winfo = winfo; @@ -248,7 +255,7 @@ p = NULL; } /* read a new grammar via socket */ - if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur->lmvar) == FALSE) { + if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur) == FALSE) { module_send(module_sd, "\n.\n"); } else { if (cur->lmtype == LM_DFA) { @@ -282,7 +289,7 @@ p = NULL; } /* read a new grammar via socket */ - if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur->lmvar) == FALSE) { + if (read_grammar(module_fp, &new_dfa, &new_winfo, cur->am->hmminfo, cur) == FALSE) { module_send(module_sd, "\n.\n"); } else { if (cur->lmtype == LM_DFA) { Index: julius4/julius/output_module.c diff -u julius4/julius/output_module.c:1.3 julius4/julius/output_module.c:1.4 --- julius4/julius/output_module.c:1.3 Sun Oct 12 08:11:50 2008 +++ julius4/julius/output_module.c Fri Oct 17 08:43:25 2008 @@ -12,7 +12,7 @@ * @author Akinobu Lee * @date Tue Sep 06 14:46:49 2005 * - * $Revision: 1.3 $ + * $Revision: 1.4 $ * */ /* @@ -657,6 +657,10 @@ { MULTIGRAM *m; + if (r->lmtype == LM_PROB) { + module_send(module_sd, "\n.\n"); + return; + } module_send(module_sd, "\n"); for(m=r->lm->grammars;m;m=m->next) { module_send(module_sd, " #%2d: [%-11s] %4d words", From sumomo @ users.sourceforge.jp Fri Oct 17 08:43:25 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 08:43:25 +0900 Subject: [Julius-cvs 330] CVS update: julius4/libjulius/src Message-ID: <1224200605.398204.6643.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/src/beam.c diff -u julius4/libjulius/src/beam.c:1.8 julius4/libjulius/src/beam.c:1.9 --- julius4/libjulius/src/beam.c:1.8 Thu Feb 21 13:10:05 2008 +++ julius4/libjulius/src/beam.c Fri Oct 17 08:43:25 2008 @@ -42,7 +42,7 
@@ * @author Akinobu LEE * @date Tue Feb 22 17:00:45 2005 * - * $Revision: 1.8 $ + * $Revision: 1.9 $ * */ /* @@ -1713,24 +1713,31 @@ } if (r->lmtype == LM_DFA && r->lmvar == LM_DFA_WORD) { - /* all words can appear at start */ - for (i=0;i<wchmm->winfo->num;i++) { - if (wchmm->hmminfo->multipath) { - node = wchmm->wordbegin[i]; - } else { - node = wchmm->offset[i][0]; - } - if (node_exist_token(d, d->tn, node, d->bos.wid) != TOKENID_UNDEFINED) continue; - newid = create_token(d); - new = &(d->tlist[d->tn][newid]); - new->last_tre = &(d->bos); - new->last_lscore = 0.0; - if (wchmm->hmminfo->multipath) { - new->score = 0.0; - } else { - new->score = outprob_style(wchmm, node, d->bos.wid, 0, param); + /* アクティブな文法に属する単語のみ許す */ + /* only words in active grammars are allowed to be an initial words */ + MULTIGRAM *m; + + for(m = r->lm->grammars; m; m = m->next) { + if (m->active) { + for(i = m->word_begin; i < m->word_begin + m->winfo->num; i++) { + if (wchmm->hmminfo->multipath) { + node = wchmm->wordbegin[i]; + } else { + node = wchmm->offset[i][0]; + } + if (node_exist_token(d, d->tn, node, d->bos.wid) != TOKENID_UNDEFINED) continue; + newid = create_token(d); + new = &(d->tlist[d->tn][newid]); + new->last_tre = &(d->bos); + new->last_lscore = 0.0; + if (wchmm->hmminfo->multipath) { + new->score = 0.0; + } else { + new->score = outprob_style(wchmm, node, d->bos.wid, 0, param); + } + node_assign_token(d, node, newid); + } } - node_assign_token(d, node, newid); } } Index: julius4/libjulius/src/multi-gram.c diff -u julius4/libjulius/src/multi-gram.c:1.5 julius4/libjulius/src/multi-gram.c:1.6 --- julius4/libjulius/src/multi-gram.c:1.5 Tue Aug 5 18:47:56 2008 +++ julius4/libjulius/src/multi-gram.c Fri Oct 17 08:43:25 2008 @@ -47,7 +47,7 @@ * @author Akinobu Lee * @date Sat Jun 18 23:45:18 2005 * - * $Revision: 1.5 $ + * $Revision: 1.6 $ * */ /* @@ -688,9 +688,9 @@ } if (m->newbie) m->newbie = FALSE; if (lm->lmvar == LM_DFA_WORD) { - /* just append dictionaty (category ID is bogus
here) */ + /* just append dictionaty */ m->word_begin = lm->winfo->num; - if (voca_append(lm->winfo, m->winfo, 0, m->word_begin) == FALSE) { + if (voca_append(lm->winfo, m->winfo, m->id, m->word_begin) == FALSE) { jlog("ERROR: multi-gram: failed to add dictionary #%d to recognition network\n", m->id); /* mark as delete */ m->hook |= MULTIGRAM_DELETE; @@ -722,9 +722,9 @@ } if (m->newbie) m->newbie = FALSE; if (lm->lmvar == LM_DFA_WORD) { - /* just append dictionaty (category ID is bogus here) */ + /* just append dictionaty */ m->word_begin = lm->winfo->num; - if (voca_append(lm->winfo, m->winfo, 0, m->word_begin) == FALSE) { + if (voca_append(lm->winfo, m->winfo, m->id, m->word_begin) == FALSE) { jlog("ERROR: multi-gram: failed to add dictionary #%d to recognition network\n", m->id); /* mark as delete */ m->hook |= MULTIGRAM_DELETE; @@ -762,7 +762,6 @@ #ifdef MDEBUG jlog("STAT: grammar update completed\n"); #endif - } if (lm->global_modified || active_changed) { return (TRUE); @@ -1143,7 +1142,7 @@ offset = m->winfo->num; printf("adding %d words to grammar #%d (%d words)\n", winfo->num, m->id, m->winfo->num); /* append to the grammar */ - if (voca_append(m->winfo, winfo, 0, offset) == FALSE) { + if (voca_append(m->winfo, winfo, m->id, offset) == FALSE) { jlog("ERROR: multi-gram: failed to add words to dict in grammar #%d \"%s\"\n", m->id, m->name); return FALSE; } Index: julius4/libjulius/src/wchmm.c diff -u julius4/libjulius/src/wchmm.c:1.5 julius4/libjulius/src/wchmm.c:1.6 --- julius4/libjulius/src/wchmm.c:1.5 Tue Sep 30 12:58:17 2008 +++ julius4/libjulius/src/wchmm.c Fri Oct 17 08:43:25 2008 @@ -31,7 +31,7 @@ * @author Akinobu Lee * @date Mon Sep 19 23:39:15 2005 * - * $Revision: 1.5 $ + * $Revision: 1.6 $ * */ /* @@ -1652,7 +1652,7 @@ /* 最も長く音素を共有出来る単語を探す */ maxsharelen=0; for (j=0;j<i;j++) { - if (wchmm->category_tree && wchmm->lmvar == LM_DFA_GRAMMAR) { + if (wchmm->category_tree && wchmm->lmtype == LM_DFA) { if (wchmm->winfo->wton[i] != wchmm->winfo->wton[j]) continue; } sharelen =
wchmm_check_match(wchmm->winfo, i, j); @@ -1811,7 +1811,7 @@ windex = (WORD_ID *)mymalloc(sizeof(WORD_ID) * wchmm->winfo->num); for(i=0;i<wchmm->winfo->num;i++) windex[i] = i; - if (wchmm->category_tree && wchmm->lmvar == LM_DFA_GRAMMAR) { + if (wchmm->category_tree && wchmm->lmtype == LM_DFA) { /* sort by category -> sort by word ID in each category */ wchmm_sort_idx_by_category(wchmm->winfo, windex, wchmm->winfo->num); @@ -1903,7 +1903,7 @@ ret = wchmm_add_word(wchmm, i, 0, 0, lmconf->enable_iwsp); } else { /* the previous word (last_i) is always the most matched one */ - if (wchmm->category_tree && wchmm->lmvar == LM_DFA_GRAMMAR) { + if (wchmm->category_tree && wchmm->lmtype == LM_DFA) { if (wchmm->winfo->wton[i] != wchmm->winfo->wton[last_i]) { ret = wchmm_add_word(wchmm, i, 0, 0, lmconf->enable_iwsp); } else { From sumomo @ users.sourceforge.jp Fri Oct 17 08:43:25 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 08:43:25 +0900 Subject: [Julius-cvs 331] CVS update: julius4/libsent/include/sent Message-ID: <1224200605.546069.6652.nullmailer@users.sourceforge.jp> Index: julius4/libsent/include/sent/vocabulary.h diff -u julius4/libsent/include/sent/vocabulary.h:1.3 julius4/libsent/include/sent/vocabulary.h:1.4 --- julius4/libsent/include/sent/vocabulary.h:1.3 Tue Aug 5 18:50:53 2008 +++ julius4/libsent/include/sent/vocabulary.h Fri Oct 17 08:43:25 2008 @@ -30,7 +30,7 @@ * @author Akinobu LEE * @date Sat Feb 12 12:38:13 2005 * - * $Revision: 1.3 $ + * $Revision: 1.4 $ * */ /* @@ -103,6 +103,7 @@ boolean voca_load_word_line(char *buf, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailpohone, char *contextphone); boolean voca_load_wordlist(FILE *fp, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone); +boolean voca_load_wordlist_fp(FILE *fp, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone); boolean
voca_load_wordlist_line(char *buf, WORD_ID *vnum, int linenum, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, boolean do_conv, boolean *ok_flag, char *headphone, char *tailphone, char *contextphone); boolean voca_mono2tri(WORD_INFO *winfo, HTK_HMM_INFO *hmminfo); WORD_ID voca_lookup_wid(char *, WORD_INFO *); From sumomo @ users.sourceforge.jp Fri Oct 17 08:43:25 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 08:43:25 +0900 Subject: [Julius-cvs 332] CVS update: julius4/libsent/src/voca Message-ID: <1224200605.733937.6661.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/voca/voca_load_htkdict.c diff -u julius4/libsent/src/voca/voca_load_htkdict.c:1.5 julius4/libsent/src/voca/voca_load_htkdict.c:1.6 --- julius4/libsent/src/voca/voca_load_htkdict.c:1.5 Tue Sep 30 12:58:18 2008 +++ julius4/libsent/src/voca/voca_load_htkdict.c Fri Oct 17 08:43:25 2008 @@ -19,7 +19,7 @@ * @author Akinobu LEE * @date Fri Feb 18 19:43:06 2005 * - * $Revision: 1.5 $ + * $Revision: 1.6 $ * */ /* @@ -645,6 +645,9 @@ int i; n = woffset; + while (n >= dstinfo->maxnum) { + if (winfo_expand(dstinfo) == FALSE) return FALSE; + } for(w=0;w<srcinfo->num;w++) { /* copy data */ dstinfo->wlen[n] = srcinfo->wlen[w]; @@ -662,12 +665,10 @@ if (n >= dstinfo->maxnum) { if (winfo_expand(dstinfo) == FALSE) return FALSE; } + } dstinfo->num = n; - /* compute maxwn */ - voca_set_stats(dstinfo); - - return TRUE; + return(voca_load_end(dstinfo)); } Index: julius4/libsent/src/voca/voca_load_wordlist.c diff -u julius4/libsent/src/voca/voca_load_wordlist.c:1.4 julius4/libsent/src/voca/voca_load_wordlist.c:1.5 --- julius4/libsent/src/voca/voca_load_wordlist.c:1.4 Tue Sep 30 12:58:18 2008 +++ julius4/libsent/src/voca/voca_load_wordlist.c Fri Oct 17 08:43:25 2008 @@ -13,7 +13,7 @@ * @author Akinobu LEE * @date Sun Jul 22 13:29:32 2007 * - * $Revision: 1.4 $ + * $Revision: 1.5 $ * */ /* @@ -127,7 +127,7 @@ return TRUE; } /** - * Top function to read word list via file pointer + *
Top function to read word list via text * * @param fp [in] file pointer * @param winfo [out] pointer to word dictionary to store the read data. @@ -152,6 +152,33 @@ return(ret); } + +/** + * Top function to read word list via file pointer + * + * @param fp [in] file pointer + * @param winfo [out] pointer to word dictionary to store the read data. + * @param hmminfo [in] HTK %HMM definition data. if NULL, phonemes are ignored. + * @param headphone [in] word head silence model name + * @param tailphone [in] word tail silence model name + * @param contextphone [in] silence context name to be used at head and tail + * + * @return TRUE on success, FALSE on any error word. + */ +boolean +voca_load_wordlist_fp(FILE *fp, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone) +{ + boolean ret; + + voca_load_start(winfo, hmminfo, FALSE); + while (getl_fp(buf, sizeof(buf), fp) != NULL) { + if (voca_load_word_line(buf, winfo, hmminfo, headphone, tailphone, contextphone) == FALSE) break; + } + ret = voca_load_end(winfo); + + return(ret); +} + /** * Sub function to Add a dictionary entry line to the word dictionary. 
* @@ -421,6 +448,7 @@ winfo->wseq[vnum] = (HMM_Logical **)mybmalloc2(sizeof(HMM_Logical *) * len, &(winfo->mroot)); memcpy(winfo->wseq[vnum], tmpwseq, sizeof(HMM_Logical *) * len); winfo->wlen[vnum] = len; + winfo->wton[vnum] = 0; } vnum++; From sumomo @ users.sourceforge.jp Fri Oct 17 23:49:21 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Fri, 17 Oct 2008 23:49:21 +0900 Subject: [Julius-cvs 333] CVS update: julius4/libjulius/src Message-ID: <1224254961.130614.24723.nullmailer@users.sourceforge.jp> Index: julius4/libjulius/src/multi-gram.c diff -u julius4/libjulius/src/multi-gram.c:1.6 julius4/libjulius/src/multi-gram.c:1.7 --- julius4/libjulius/src/multi-gram.c:1.6 Fri Oct 17 08:43:25 2008 +++ julius4/libjulius/src/multi-gram.c Fri Oct 17 23:49:20 2008 @@ -47,7 +47,7 @@ * @author Akinobu Lee * @date Sat Jun 18 23:45:18 2005 * - * $Revision: 1.6 $ + * $Revision: 1.7 $ * */ /* @@ -762,6 +762,7 @@ #ifdef MDEBUG jlog("STAT: grammar update completed\n"); #endif + } if (lm->global_modified || active_changed) { return (TRUE); From sumomo @ users.sourceforge.jp Mon Oct 20 17:40:08 2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Mon, 20 Oct 2008 17:40:08 +0900 Subject: [Julius-cvs 334] CVS update: julius4/libsent/src/voca Message-ID: <1224492008.203704.30331.nullmailer@users.sourceforge.jp> Index: julius4/libsent/src/voca/voca_load_htkdict.c diff -u julius4/libsent/src/voca/voca_load_htkdict.c:1.6 julius4/libsent/src/voca/voca_load_htkdict.c:1.7 --- julius4/libsent/src/voca/voca_load_htkdict.c:1.6 Fri Oct 17 08:43:25 2008 +++ julius4/libsent/src/voca/voca_load_htkdict.c Mon Oct 20 17:40:07 2008 @@ -19,7 +19,7 @@ * @author Akinobu LEE * @date Fri Feb 18 19:43:06 2005 * - * $Revision: 1.6 $ + * $Revision: 1.7 $ * */ /* @@ -669,6 +669,9 @@ } dstinfo->num = n; - return(voca_load_end(dstinfo)); + /* compute maxwn */ + voca_set_stats(dstinfo); + + return TRUE; } From sumomo @ users.sourceforge.jp Tue Oct 21 02:40:23 
2008 From: sumomo @ users.sourceforge.jp (sumomo @ users.sourceforge.jp) Date: Tue, 21 Oct 2008 02:40:23 +0900 Subject: [Julius-cvs 335] CVS update: julius4/julius Message-ID: <1224524423.464230.8233.nullmailer@users.sourceforge.jp> Index: julius4/julius/output_module.c diff -u julius4/julius/output_module.c:1.4 julius4/julius/output_module.c:1.5 --- julius4/julius/output_module.c:1.4 Fri Oct 17 08:43:25 2008 +++ julius4/julius/output_module.c Tue Oct 21 02:40:23 2008 @@ -12,7 +12,7 @@ * @author Akinobu Lee * @date Tue Sep 06 14:46:49 2005 * - * $Revision: 1.4 $ + * $Revision: 1.5 $ * */ /* @@ -29,10 +29,6 @@ extern int module_sd; extern boolean separate_score_flag; - -/// Grammar status to be processed in the next reload timing. -static char *hookstr[] = {"", "delete", "activate", "deactivate"}; - /**********************************************************************/ /* process online/offline status */ @@ -656,6 +652,7 @@ send_gram_info(RecogProcess *r) { MULTIGRAM *m; + char buf[1024]; if (r->lmtype == LM_PROB) { module_send(module_sd, "\n.\n"); @@ -663,19 +660,34 @@ } module_send(module_sd, "\n"); for(m=r->lm->grammars;m;m=m->next) { - module_send(module_sd, " #%2d: [%-11s] %4d words", - m->id, - m->active ? 
"active" : "inactive", - m->winfo->num); + buf[0] = '\0'; if (m->dfa) { - module_send(module_sd, ", %3d categories, %4d nodes", - m->dfa->term_num, m->dfa->state_num); + snprintf(buf, 1024, ", %3d categories, %4d nodes", + m->dfa->term_num, m->dfa->state_num); } - if (m->newbie) module_send(module_sd, " (new)"); - if (m->hook != MULTIGRAM_DEFAULT) { - module_send(module_sd, " (next: %s)", hookstr[m->hook]); + if (m->newbie) strcat(buf, " (new)"); + if (m->hook != 0) { + strcat(buf, " (next:"); + if (m->hook & MULTIGRAM_DELETE) { + strcat(buf, " delete"); + } + if (m->hook & MULTIGRAM_ACTIVATE) { + strcat(buf, " activate"); + } + if (m->hook & MULTIGRAM_DEACTIVATE) { + strcat(buf, " deactivate"); + } + if (m->hook & MULTIGRAM_MODIFIED) { + strcat(buf, " modified"); + } + strcat(buf, ")"); } - module_send(module_sd, " \"%s\"\n", m->name); + module_send(module_sd, " #%2d: [%-11s] %4d words%s \"%s\"\n", + m->id, + m->active ? "active" : "inactive", + m->winfo->num, + buf, + m->name); } if (r->lm->dfa != NULL) { module_send(module_sd, " Global: %4d words, %3d categories, %4d nodes\n", r->lm->winfo->num, r->lm->dfa->term_num, r->lm->dfa->state_num); Index: julius4/julius/output_stdout.c diff -u julius4/julius/output_stdout.c:1.5 julius4/julius/output_stdout.c:1.6 --- julius4/julius/output_stdout.c:1.5 Tue Mar 18 01:58:37 2008 +++ julius4/julius/output_stdout.c Tue Oct 21 02:40:23 2008 @@ -12,7 +12,7 @@ * @author Akinobu Lee * @date Tue Sep 06 17:18:46 2005 * - * $Revision: 1.5 $ + * $Revision: 1.6 $ * */ /* @@ -26,9 +26,6 @@ extern boolean separate_score_flag; -/// Grammar status to be processed in the next reload timing. 
-static char *hookstr[] = {"", "delete", "activate", "deactivate"}; - static boolean have_progout = FALSE; /* for short pause segmentation and successive decoding */ @@ -1182,6 +1179,7 @@ MULTIGRAM *m; RecogProcess *r; boolean multi; + char buf[1024]; if (recog->process_list->next != NULL) multi = TRUE; else multi = FALSE; @@ -1189,18 +1187,40 @@ for(r=recog->process_list;r;r=r->next) { if (! r->live) continue; if (multi) printf("[#%d %s]\n", r->config->id, r->config->name); - + if (r->lmtype == LM_PROB) { + printf("NOT A GRAMMAR-BASED LM\n"); + continue; + } printf("[grammars]\n"); for(m=r->lm->grammars;m;m=m->next) { - printf(" #%2d: [%-11s] %4d words, %3d categories, %4d nodes", - m->id, - m->active ? "active" : "inactive", - m->winfo->num, m->dfa->term_num, m->dfa->state_num); - if (m->newbie) printf(" (new)"); - if (m->hook != MULTIGRAM_DEFAULT) { - printf(" (next: %s)", hookstr[m->hook]); + buf[0] = '\0'; + if (m->dfa) { + snprintf(buf, 1024, ", %3d categories, %4d nodes", + m->dfa->term_num, m->dfa->state_num); + } + if (m->newbie) strcat(buf, " (new)"); + if (m->hook != 0) { + strcat(buf, " (next:"); + if (m->hook & MULTIGRAM_DELETE) { + strcat(buf, " delete"); + } + if (m->hook & MULTIGRAM_ACTIVATE) { + strcat(buf, " activate"); + } + if (m->hook & MULTIGRAM_DEACTIVATE) { + strcat(buf, " deactivate"); + } + if (m->hook & MULTIGRAM_MODIFIED) { + strcat(buf, " modified"); + } + strcat(buf, ")"); } - myprintf(" \"%s\"\n", m->name); + myprintf(" #%2d: [%-11s] %4d words%s \"%s\"\n", + m->id, + m->active ? "active" : "inactive", + m->winfo->num, + buf, + m->name); } if (r->lm->dfa != NULL) { printf(" Global: %4d words, %3d categories, %4d nodes\n", r->lm->winfo->num, r->lm->dfa->term_num, r->lm->dfa->state_num);