I have been trying to set up local speech-to-text (STT) using faster-whisper, which exposes an OpenAI-compatible API, and I believe it is configured correctly in the JSON below.
But when I send an audio message via either WhatsApp or Telegram, OpenClaw tries to use the image tool to decode it.
I am at a loss. Here is the relevant part of my configuration:
"audio": {
"enabled": true,
"echoTranscript": true,
"echoFormat": "📝 {transcript}",
"attachments": {
"mode": "all",
"maxAttachments": 1
},
"maxBytes": 20971520,
"models": [
{
"provider": "openai",
"model": "base",
"providerOptions": {
"baseUrl": {
"default": "http://127.0.0.1:10300/v1"
},
"apiKey": {
"default": "sk-not-needed"
}
}
}
]
}