基于 ONNX 的实时语音转文本输入法,C++ 跨平台实现。 核心组件: - Qt 6 跨平台 GUI(实时识别 / 文件转写 / 配置页面) - ONNX Runtime 推理引擎(异步模型加载) - PortAudio 音频采集 - dr_libs 音频文件解码 - JSON 配置管理(线程安全,自动持久化) - 日志系统(控制台 + 文件输出) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
30 lines
626 B
JSON
30 lines
626 B
JSON
{
|
|
"version": 1,
|
|
"stt": {
|
|
"model_path": "",
|
|
"model_type": "whisper",
|
|
"device": "cpu",
|
|
"num_threads": 4,
|
|
"sample_rate": 16000,
|
|
"language": "zh",
|
|
"streaming": true,
|
|
"beam_size": 5,
|
|
"temperature": 0.0
|
|
},
|
|
"audio": {
|
|
"input_device": -1,
|
|
"buffer_size_ms": 20,
|
|
"chunk_duration_ms": 3000,
|
|
"padding_ms": 500
|
|
},
|
|
"ui": {
|
|
"theme": "light",
|
|
"font_size": 14,
|
|
"show_waveform": true,
|
|
"show_confidence": true
|
|
},
|
|
"shortcuts": {
|
|
"toggle_recording": "Ctrl+Space"
|
|
}
|
|
}
|