Sogl-coder committed on
Commit
a2537c1
·
unverified ·
1 Parent(s): b062b12

examples: Update README.md of main.cpp (#1306)

Browse files
Files changed (1) hide show
  1. README.md +11 -4
README.md CHANGED
@@ -113,30 +113,37 @@ options:
113
  -d N, --duration N [0 ] duration of audio to process in milliseconds
114
  -mc N, --max-context N [-1 ] maximum number of text context tokens to store
115
  -ml N, --max-len N [0 ] maximum segment length in characters
116
- -bo N, --best-of N [5 ] number of best candidates to keep
 
117
  -bs N, --beam-size N [-1 ] beam size for beam search
118
  -wt N, --word-thold N [0.01 ] word timestamp probability threshold
119
  -et N, --entropy-thold N [2.40 ] entropy threshold for decoder fail
120
  -lpt N, --logprob-thold N [-1.00 ] log probability threshold for decoder fail
121
- -su, --speed-up [false ] speed up audio by x2 (reduced accuracy)
122
  -tr, --translate [false ] translate from source language to english
123
- -tdrz, --tinydiarize [false ] enable tinydiarize (requires a tdrz model)
124
  -di, --diarize [false ] stereo audio diarization
 
125
  -nf, --no-fallback [false ] do not use temperature fallback while decoding
126
  -otxt, --output-txt [false ] output result in a text file
127
  -ovtt, --output-vtt [false ] output result in a vtt file
128
  -osrt, --output-srt [false ] output result in a srt file
 
129
  -owts, --output-words [false ] output script for generating karaoke video
 
130
  -ocsv, --output-csv [false ] output result in a CSV file
 
131
  -of FNAME, --output-file FNAME [ ] output file path (without file extension)
132
  -ps, --print-special [false ] print special tokens
133
  -pc, --print-colors [false ] print colors
134
  -pp, --print-progress [false ] print progress
135
- -nt, --no-timestamps [true ] do not print timestamps
136
  -l LANG, --language LANG [en ] spoken language ('auto' for auto-detect)
 
137
  --prompt PROMPT [ ] initial prompt
138
  -m FNAME, --model FNAME [models/ggml-base.en.bin] model path
139
  -f FNAME, --file FNAME [ ] input WAV file path
 
 
140
 
141
 
142
  bash ./models/download-ggml-model.sh base.en
 
113
  -d N, --duration N [0 ] duration of audio to process in milliseconds
114
  -mc N, --max-context N [-1 ] maximum number of text context tokens to store
115
  -ml N, --max-len N [0 ] maximum segment length in characters
116
+ -sow, --split-on-word [false ] split on word rather than on token
117
+ -bo N, --best-of N [2 ] number of best candidates to keep
118
  -bs N, --beam-size N [-1 ] beam size for beam search
119
  -wt N, --word-thold N [0.01 ] word timestamp probability threshold
120
  -et N, --entropy-thold N [2.40 ] entropy threshold for decoder fail
121
  -lpt N, --logprob-thold N [-1.00 ] log probability threshold for decoder fail
122
+ -debug, --debug-mode [false ] enable debug mode (e.g. dump log_mel)
123
  -tr, --translate [false ] translate from source language to english
 
124
  -di, --diarize [false ] stereo audio diarization
125
+ -tdrz, --tinydiarize [false ] enable tinydiarize (requires a tdrz model)
126
  -nf, --no-fallback [false ] do not use temperature fallback while decoding
127
  -otxt, --output-txt [false ] output result in a text file
128
  -ovtt, --output-vtt [false ] output result in a vtt file
129
  -osrt, --output-srt [false ] output result in a srt file
130
+ -olrc, --output-lrc [false ] output result in a lrc file
131
  -owts, --output-words [false ] output script for generating karaoke video
132
+ -fp, --font-path [/System/Library/Fonts/Supplemental/Courier New Bold.ttf] path to a monospace font for karaoke video
133
  -ocsv, --output-csv [false ] output result in a CSV file
134
+ -oj, --output-json [false ] output result in a JSON file
135
  -of FNAME, --output-file FNAME [ ] output file path (without file extension)
136
  -ps, --print-special [false ] print special tokens
137
  -pc, --print-colors [false ] print colors
138
  -pp, --print-progress [false ] print progress
139
+ -nt, --no-timestamps [false ] do not print timestamps
140
  -l LANG, --language LANG [en ] spoken language ('auto' for auto-detect)
141
+ -dl, --detect-language [false ] exit after automatically detecting language
142
  --prompt PROMPT [ ] initial prompt
143
  -m FNAME, --model FNAME [models/ggml-base.en.bin] model path
144
  -f FNAME, --file FNAME [ ] input WAV file path
145
+ -oved DNAME, --ov-e-device DNAME [CPU ] the OpenVINO device used for encode inference
146
+ -ls, --log-score [false ] log best decoder scores of tokens
147
 
148
 
149
  bash ./models/download-ggml-model.sh base.en