GET /tts?text=你好&voice=zh-CN-XiaoxiaoNeural&rate=0&pitch=0&format=audio/mpeg&download=true
POST /v1/audio/speech { "model": "0|0", "input": "你好世界", "voice": "zh-CN-XiaoxiaoNeural" }
GET /voices
GET /voices?locale=zh
GET /voices?format=yaml&detail=true
GET /voices?format=json_map