# Request: POST an inline audio clip (declared as audio/mp3) to the
# gemini-2.0-flash generateContent endpoint together with a text prompt
# (written in Chinese) asking the model to transcribe and summarize the audio.
#
# Placeholders that must be substituted before running; they are sent
# literally otherwise:
#   {{GEMINI_API_KEY}}           - API key, passed in the `key` query parameter
#   <BASE64_ENCODED_AUDIO_DATA>  - presumably the base64-encoded audio bytes
#
# -g (--globoff) keeps curl from interpreting the braces in the URL as glob
# patterns. --request POST is kept alongside --location so the method is
# still POST if the server redirects.
#
# NOTE(review): the key travels in the URL query string, which can end up in
# shell history and server logs - confirm whether this endpoint also accepts
# the key in a request header.
#
# The body must end at the closing quote after the final brace: any text glued
# onto that quote becomes part of the posted JSON, and everything after it is
# executed by the shell.
curl --location -g --request POST 'https://newapi.mexxxxai.win/v1beta/models/gemini-2.0-flash:generateContent?key={{GEMINI_API_KEY}}' \
--header 'Content-Type: application/json' \
--data-raw '{
"contents": [
{
"parts": [
{"inlineData": {"mimeType": "audio/mp3", "data": "<BASE64_ENCODED_AUDIO_DATA>"}},
{"text": "请转录并总结这段音频的内容。"}
]
}
],
"generationConfig": {"temperature": 0.3, "maxOutputTokens": 2048}
}'

# Sample response, reproduced verbatim for reference. It is kept as comments
# so the shell never tries to execute it and it cannot leak into the request
# body above.
#
# {
# "candidates": [
# {
# "content": {
# "parts": [
# {
# "text": "**转录内容:**\n\n【大家好,欢迎收听本期播客。今天我们邀请到了人工智能领域的专家张教授,一起聊聊大语言模型的最新进展……】\n\n**内容摘要:**\n\n本段音频为一期科技播客的开头部分,时长约45秒。主持人介绍了本期嘉宾张教授,并预告将围绕大语言模型(LLM)的技术发展和应用场景展开讨论。音频质量清晰,无明显噪音。"
# }
# ],
# "role": "model"
# },
# "finishReason": "STOP",
# "index": 0
# }
# ],
# "usageMetadata": {
# "promptTokenCount": 1240,
# "candidatesTokenCount": 112,
# "totalTokenCount": 1352
# }
# }