{"id":179,"date":"2026-03-21T22:47:21","date_gmt":"2026-03-21T14:47:21","guid":{"rendered":"https:\/\/pa.yingzhi8.cn\/index.php\/2026\/03\/21\/nodes-media-understanding\/"},"modified":"2026-03-21T23:08:56","modified_gmt":"2026-03-21T15:08:56","slug":"nodes-media-understanding","status":"publish","type":"post","link":"https:\/\/pa.yingzhi8.cn\/index.php\/2026\/03\/21\/nodes-media-understanding\/","title":{"rendered":"\u5a92\u4f53\u7406\u89e3"},"content":{"rendered":"<h1>\u5a92\u4f53\u7406\u89e3<\/h1>\n<h1>\u5a92\u4f53\u7406\u89e3\uff08\u5165\u7ad9\uff09\u2014 2026-01-17<\/h1>\n<p>OpenClaw \u53ef\u4ee5\u5728\u56de\u590d\u6d41\u7a0b\u8fd0\u884c\u4e4b\u524d<strong>\u6458\u8981\u5165\u7ad9\u5a92\u4f53<\/strong>\uff08\u56fe\u7247\/\u97f3\u9891\/\u89c6\u9891\uff09\u3002\u5b83\u4f1a\u81ea\u52a8\u68c0\u6d4b\u672c\u5730\u5de5\u5177\u6216\u63d0\u4f9b\u5546\u5bc6\u94a5\u662f\u5426\u53ef\u7528\uff0c\u5e76\u4e14\u53ef\u4ee5\u7981\u7528\u6216\u81ea\u5b9a\u4e49\u3002\u5982\u679c\u7406\u89e3\u5173\u95ed\uff0c\u6a21\u578b\u4ecd\u7136\u4f1a\u50cf\u5f80\u5e38\u4e00\u6837\u63a5\u6536\u539f\u59cb\u6587\u4ef6\/URL\u3002<\/p>\n<h2>\u76ee\u6807<\/h2>\n<ul>\n<li>\u53ef\u9009\uff1a\u5c06\u5165\u7ad9\u5a92\u4f53\u9884\u5148\u6d88\u5316\u4e3a\u77ed\u6587\u672c\uff0c\u4ee5\u4fbf\u66f4\u5feb\u8def\u7531 + \u66f4\u597d\u7684\u547d\u4ee4\u89e3\u6790\u3002<\/li>\n<li>\u4fdd\u7559\u539f\u59cb\u5a92\u4f53\u4f20\u9012\u7ed9\u6a21\u578b\uff08\u59cb\u7ec8\uff09\u3002<\/li>\n<li>\u652f\u6301<strong>\u63d0\u4f9b\u5546 API<\/strong> \u548c <strong>CLI 
\u56de\u9000<\/strong>\u3002<\/li>\n<li>\u5141\u8bb8\u591a\u4e2a\u6a21\u578b\u5e76\u6309\u987a\u5e8f\u56de\u9000\uff08\u9519\u8bef\/\u5927\u5c0f\/\u8d85\u65f6\uff09\u3002<\/li>\n<\/ul>\n<h2>\u9ad8\u5c42\u884c\u4e3a<\/h2>\n<ol>\n<li>\u6536\u96c6\u5165\u7ad9\u9644\u4ef6\uff08<code>MediaPaths<\/code>\u3001<code>MediaUrls<\/code>\u3001<code>MediaTypes<\/code>\uff09\u3002<\/li>\n<li>\u5bf9\u4e8e\u6bcf\u4e2a\u542f\u7528\u7684\u80fd\u529b\uff08\u56fe\u7247\/\u97f3\u9891\/\u89c6\u9891\uff09\uff0c\u6839\u636e\u7b56\u7565\u9009\u62e9\u9644\u4ef6\uff08\u9ed8\u8ba4\uff1a<strong>\u7b2c\u4e00\u4e2a<\/strong>\uff09\u3002<\/li>\n<li>\u9009\u62e9\u7b2c\u4e00\u4e2a\u7b26\u5408\u6761\u4ef6\u7684\u6a21\u578b\u6761\u76ee\uff08\u5927\u5c0f + \u80fd\u529b + \u8ba4\u8bc1\uff09\u3002<\/li>\n<li>\u5982\u679c\u6a21\u578b\u5931\u8d25\u6216\u5a92\u4f53\u592a\u5927\uff0c<strong>\u56de\u9000\u5230\u4e0b\u4e00\u4e2a\u6761\u76ee<\/strong>\u3002<\/li>\n<li>\u6210\u529f\u65f6\uff1a\n<ul>\n<li><code>Body<\/code> \u53d8\u4e3a <code>[Image]<\/code>\u3001<code>[Audio]<\/code> \u6216 <code>[Video]<\/code> \u5757\u3002<\/li>\n<li>\u97f3\u9891\u8bbe\u7f6e <code>{{Transcript}}<\/code>\uff1b\u547d\u4ee4\u89e3\u6790\u5728\u6709\u6807\u9898\u6587\u672c\u65f6\u4f7f\u7528\u6807\u9898\u6587\u672c\uff0c\u5426\u5219\u4f7f\u7528\u8f6c\u5f55\u3002<\/li>\n<li>\u6807\u9898\u4f5c\u4e3a <code>User text:<\/code> \u4fdd\u7559\u5728\u5757\u5185\u3002<\/li>\n<\/ul>\n<\/li>\n<\/ol>\n<p>\u5982\u679c\u7406\u89e3\u5931\u8d25\u6216\u88ab\u7981\u7528\uff0c<strong>\u56de\u590d\u6d41\u7a0b\u7ee7\u7eed<\/strong>\u4f7f\u7528\u539f\u59cb\u6b63\u6587 + \u9644\u4ef6\u3002<\/p>\n<h2>\u914d\u7f6e\u6982\u8ff0<\/h2>\n<p><code>tools.media<\/code> \u652f\u6301<strong>\u5171\u4eab\u6a21\u578b<\/strong>\u52a0\u4e0a\u6bcf\u80fd\u529b\u8986\u76d6\uff1a<\/p>\n<ul>\n<li><code>tools.media.models<\/code>\uff1a\u5171\u4eab\u6a21\u578b\u5217\u8868\uff08\u4f7f\u7528 <code>capabilities<\/code> 
\u6765\u9650\u5b9a\uff09\u3002<\/li>\n<li><code>tools.media.image<\/code> \/ <code>tools.media.audio<\/code> \/ <code>tools.media.video<\/code>\uff1a<\/li>\n<li>\u9ed8\u8ba4\u503c\uff08<code>prompt<\/code>\u3001<code>maxChars<\/code>\u3001<code>maxBytes<\/code>\u3001<code>timeoutSeconds<\/code>\u3001<code>language<\/code>\uff09<\/li>\n<li>\u63d0\u4f9b\u5546\u8986\u76d6\uff08<code>baseUrl<\/code>\u3001<code>headers<\/code>\u3001<code>providerOptions<\/code>\uff09<\/li>\n<li>\u901a\u8fc7 <code>tools.media.audio.providerOptions.deepgram<\/code> \u914d\u7f6e Deepgram \u97f3\u9891\u9009\u9879<\/li>\n<li>\u53ef\u9009\u7684<strong>\u6bcf\u80fd\u529b <code>models<\/code> \u5217\u8868<\/strong>\uff08\u4f18\u5148\u4e8e\u5171\u4eab\u6a21\u578b\uff09<\/li>\n<li><code>attachments<\/code> \u7b56\u7565\uff08<code>mode<\/code>\u3001<code>maxAttachments<\/code>\u3001<code>prefer<\/code>\uff09<\/li>\n<li><code>scope<\/code>\uff08\u53ef\u9009\u7684\u6309\u6e20\u9053\/\u804a\u5929\u7c7b\u578b\/\u4f1a\u8bdd\u952e\u9650\u5b9a\uff09<\/li>\n<li><code>tools.media.concurrency<\/code>\uff1a\u6700\u5927\u5e76\u53d1\u80fd\u529b\u8fd0\u884c\u6570\uff08\u9ed8\u8ba4 <strong>2<\/strong>\uff09\u3002<\/li>\n<\/ul>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      models: [\n        \/* \u5171\u4eab\u5217\u8868 *\/\n      ],\n      image: {\n        \/* \u53ef\u9009\u8986\u76d6 *\/\n      },\n      audio: {\n        \/* \u53ef\u9009\u8986\u76d6 *\/\n      },\n      video: {\n        \/* \u53ef\u9009\u8986\u76d6 *\/\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<h3>\u6a21\u578b\u6761\u76ee<\/h3>\n<p>\u6bcf\u4e2a <code>models[]<\/code> \u6761\u76ee\u53ef\u4ee5\u662f<strong>\u63d0\u4f9b\u5546<\/strong>\u6216 <strong>CLI<\/strong>\uff1a<\/p>\n<pre><code class=\"language-json5\">{\n  type: &quot;provider&quot;, \/\/ \u7701\u7565\u65f6\u9ed8\u8ba4\n  provider: &quot;openai&quot;,\n  model: &quot;gpt-5.2&quot;,\n  prompt: &quot;Describe the image in &lt;= 500 chars.&quot;,\n  maxChars: 500,\n  maxBytes: 10485760,\n  timeoutSeconds: 60,\n  capabilities: [&quot;image&quot;], \/\/ \u53ef\u9009\uff0c\u7528\u4e8e\u591a\u6a21\u6001\u6761\u76ee\n  profile: &quot;vision-profile&quot;,\n  preferredProfile: &quot;vision-fallback&quot;,\n}\n<\/code><\/pre>\n<pre><code class=\"language-json5\">{\n  type: &quot;cli&quot;,\n  command: &quot;gemini&quot;,\n  args: [\n    &quot;-m&quot;,\n    &quot;gemini-3-flash&quot;,\n    &quot;--allowed-tools&quot;,\n    &quot;read_file&quot;,\n    &quot;Read the media at {{MediaPath}} and describe it in &lt;= {{MaxChars}} characters.&quot;,\n  ],\n  maxChars: 500,\n  maxBytes: 52428800,\n  timeoutSeconds: 120,\n  capabilities: [&quot;video&quot;, &quot;image&quot;],\n}\n<\/code><\/pre>\n<p>CLI \u6a21\u677f\u8fd8\u53ef\u4ee5\u4f7f\u7528\uff1a<\/p>\n<ul>\n<li><code>{{MediaDir}}<\/code>\uff08\u5305\u542b\u5a92\u4f53\u6587\u4ef6\u7684\u76ee\u5f55\uff09<\/li>\n<li><code>{{OutputDir}}<\/code>\uff08\u4e3a\u672c\u6b21\u8fd0\u884c\u521b\u5efa\u7684\u4e34\u65f6\u76ee\u5f55\uff09<\/li>\n<li><code>{{OutputBase}}<\/code>\uff08\u4e34\u65f6\u6587\u4ef6\u57fa\u7840\u8def\u5f84\uff0c\u65e0\u6269\u5c55\u540d\uff09<\/li>\n<\/ul>\n<h2>\u9ed8\u8ba4\u503c\u548c\u9650\u5236<\/h2>\n<p>\u63a8\u8350\u9ed8\u8ba4\u503c\uff1a<\/p>\n<ul>\n<li><code>maxChars<\/code>\uff1a\u56fe\u7247\/\u89c6\u9891\u4e3a <strong>500<\/strong>\uff08\u7b80\u77ed\uff0c\u9002\u5408\u547d\u4ee4\uff09<\/li>\n<li><code>maxChars<\/code>\uff1a\u97f3\u9891<strong>\u4e0d\u8bbe\u7f6e<\/strong>\uff08\u5b8c\u6574\u8f6c\u5f55\uff0c\u9664\u975e\u4f60\u8bbe\u7f6e\u9650\u5236\uff09<\/li>\n<li><code>maxBytes<\/code>\uff1a\n<ul>\n<li>\u56fe\u7247\uff1a<strong>10MB<\/strong><\/li>\n<li>\u97f3\u9891\uff1a<strong>20MB<\/strong><\/li>\n<li>\u89c6\u9891\uff1a<strong>50MB<\/strong><\/li>\n<\/ul>\n<\/li>\n<\/ul>\n<p>\u89c4\u5219\uff1a<\/p>\n<ul>\n<li>\u5982\u679c\u5a92\u4f53\u8d85\u8fc7 <code>maxBytes<\/code>\uff0c\u8be5\u6a21\u578b\u88ab\u8df3\u8fc7\uff0c<strong>\u5c1d\u8bd5\u4e0b\u4e00\u4e2a\u6a21\u578b<\/strong>\u3002<\/li>\n<li>\u5982\u679c\u6a21\u578b\u8fd4\u56de\u8d85\u8fc7 <code>maxChars<\/code>\uff0c\u8f93\u51fa\u88ab\u622a\u65ad\u3002<\/li>\n<li><code>prompt<\/code> \u9ed8\u8ba4\u4e3a\u7b80\u5355\u7684&quot;Describe the {media}.&quot;\u52a0\u4e0a <code>maxChars<\/code> \u6307\u5bfc\uff08\u4ec5\u56fe\u7247\/\u89c6\u9891\uff09\u3002<\/li>\n<li>\u5982\u679c <code>&lt;capability&gt;.enabled: true<\/code> \u4f46\u672a\u914d\u7f6e\u6a21\u578b\uff0c\u5f53\u63d0\u4f9b\u5546\u652f\u6301\u8be5\u80fd\u529b\u65f6\uff0cOpenClaw \u5c1d\u8bd5<strong>\u6d3b\u52a8\u7684\u56de\u590d\u6a21\u578b<\/strong>\u3002<\/li>\n<\/ul>\n<h3>\u81ea\u52a8\u68c0\u6d4b\u5a92\u4f53\u7406\u89e3\uff08\u9ed8\u8ba4\uff09<\/h3>\n<p>\u5982\u679c <code>tools.media.&lt;capability&gt;.enabled<\/code> <strong>\u672a<\/strong>\u8bbe\u7f6e\u4e3a <code>false<\/code> \u4e14\u4f60\u6ca1\u6709\u914d\u7f6e\u6a21\u578b\uff0cOpenClaw \u6309\u4ee5\u4e0b\u987a\u5e8f\u81ea\u52a8\u68c0\u6d4b\u5e76<strong>\u5728\u7b2c\u4e00\u4e2a\u53ef\u7528\u9009\u9879\u5904\u505c\u6b62<\/strong>\uff1a<\/p>\n<ol>\n<li><strong>\u672c\u5730 CLI<\/strong>\uff08\u4ec5\u97f3\u9891\uff1b\u5982\u679c\u5df2\u5b89\u88c5\uff09\n<ul>\n<li><code>sherpa-onnx-offline<\/code>\uff08\u9700\u8981\u5e26\u6709 encoder\/decoder\/joiner\/tokens \u7684 <code>SHERPA_ONNX_MODEL_DIR<\/code>\uff09<\/li>\n<li><code>whisper-cli<\/code>\uff08<code>whisper-cpp<\/code>\uff1b\u4f7f\u7528 <code>WHISPER_CPP_MODEL<\/code> \u6216\u6346\u7ed1\u7684 tiny \u6a21\u578b\uff09<\/li>\n<li><code>whisper<\/code>\uff08Python CLI\uff1b\u81ea\u52a8\u4e0b\u8f7d\u6a21\u578b\uff09<\/li>\n<\/ul>\n<\/li>\n<li><strong>Gemini CLI<\/strong>\uff08<code>gemini<\/code>\uff09\u4f7f\u7528 <code>read_many_files<\/code><\/li>\n<li><strong>\u63d0\u4f9b\u5546\u5bc6\u94a5<\/strong>\n<ul>\n<li>\u97f3\u9891\uff1aOpenAI \u2192 Groq \u2192 Deepgram \u2192 Google<\/li>\n<li>\u56fe\u7247\uff1aOpenAI \u2192 Anthropic \u2192 Google \u2192 MiniMax<\/li>\n<li>\u89c6\u9891\uff1aGoogle<\/li>\n<\/ul>\n<\/li>\n<\/ol>\n<p>\u8981\u7981\u7528\u81ea\u52a8\u68c0\u6d4b\uff0c\u8bbe\u7f6e\uff1a<\/p>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      audio: {\n        enabled: false,\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<p>\u6ce8\u610f\uff1a\u4e8c\u8fdb\u5236\u6587\u4ef6\u68c0\u6d4b\u5728 macOS\/Linux\/Windows \u4e0a\u662f\u5c3d\u529b\u800c\u4e3a\u7684\uff1b\u786e\u4fdd CLI \u5728 <code>PATH<\/code> \u4e0a\uff08\u6211\u4eec\u4f1a\u5c55\u5f00 <code>~<\/code>\uff09\uff0c\u6216\u8bbe\u7f6e\u5e26\u6709\u5b8c\u6574\u547d\u4ee4\u8def\u5f84\u7684\u663e\u5f0f CLI \u6a21\u578b\u3002<\/p>\n<h2>\u80fd\u529b\uff08\u53ef\u9009\uff09<\/h2>\n<p>\u5982\u679c\u4f60\u8bbe\u7f6e\u4e86 <code>capabilities<\/code>\uff0c\u8be5\u6761\u76ee\u4ec5\u5bf9\u8fd9\u4e9b\u5a92\u4f53\u7c7b\u578b\u8fd0\u884c\u3002\u5bf9\u4e8e\u5171\u4eab\u5217\u8868\uff0cOpenClaw \u53ef\u4ee5\u63a8\u65ad\u9ed8\u8ba4\u503c\uff1a<\/p>\n<ul>\n<li><code>openai<\/code>\u3001<code>anthropic<\/code>\u3001<code>minimax<\/code>\uff1a<strong>\u56fe\u7247<\/strong><\/li>\n<li><code>google<\/code>\uff08Gemini API\uff09\uff1a<strong>\u56fe\u7247 + \u97f3\u9891 + \u89c6\u9891<\/strong><\/li>\n<li><code>groq<\/code>\uff1a<strong>\u97f3\u9891<\/strong><\/li>\n<li><code>deepgram<\/code>\uff1a<strong>\u97f3\u9891<\/strong><\/li>\n<\/ul>\n<p>\u5bf9\u4e8e CLI \u6761\u76ee\uff0c<strong>\u663e\u5f0f\u8bbe\u7f6e <code>capabilities<\/code><\/strong> \u4ee5\u907f\u514d\u610f\u5916\u5339\u914d\u3002\u5982\u679c\u4f60\u7701\u7565 <code>capabilities<\/code>\uff0c\u8be5\u6761\u76ee\u5bf9\u5b83\u51fa\u73b0\u7684\u5217\u8868\u90fd\u7b26\u5408\u6761\u4ef6\u3002<\/p>\n<h2>\u63d0\u4f9b\u5546\u652f\u6301\u77e9\u9635\uff08OpenClaw 
\u96c6\u6210\uff09<\/h2>\n<table>\n<thead>\n<tr>\n<th>\u80fd\u529b<\/th>\n<th>\u63d0\u4f9b\u5546\u96c6\u6210<\/th>\n<th>\u8bf4\u660e<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u56fe\u7247<\/td>\n<td>OpenAI \/ Anthropic \/ Google \/ \u5176\u4ed6\u901a\u8fc7 <code>pi-ai<\/code><\/td>\n<td>\u6ce8\u518c\u8868\u4e2d\u4efb\u4f55\u652f\u6301\u56fe\u7247\u7684\u6a21\u578b\u90fd\u53ef\u7528\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u97f3\u9891<\/td>\n<td>OpenAI\u3001Groq\u3001Deepgram\u3001Google<\/td>\n<td>\u63d0\u4f9b\u5546\u8f6c\u5f55\uff08Whisper\/Deepgram\/Gemini\uff09\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u89c6\u9891<\/td>\n<td>Google\uff08Gemini API\uff09<\/td>\n<td>\u63d0\u4f9b\u5546\u89c6\u9891\u7406\u89e3\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<h2>\u63a8\u8350\u63d0\u4f9b\u5546<\/h2>\n<p><strong>\u56fe\u7247<\/strong><\/p>\n<ul>\n<li>\u5982\u679c\u652f\u6301\u56fe\u7247\uff0c\u4f18\u5148\u4f7f\u7528\u4f60\u7684\u6d3b\u52a8\u6a21\u578b\u3002<\/li>\n<li>\u826f\u597d\u7684\u9ed8\u8ba4\u503c\uff1a<code>openai\/gpt-5.2<\/code>\u3001<code>anthropic\/claude-opus-4-5<\/code>\u3001<code>google\/gemini-3-pro-preview<\/code>\u3002<\/li>\n<\/ul>\n<p><strong>\u97f3\u9891<\/strong><\/p>\n<ul>\n<li><code>openai\/gpt-4o-mini-transcribe<\/code>\u3001<code>groq\/whisper-large-v3-turbo<\/code> \u6216 <code>deepgram\/nova-3<\/code>\u3002<\/li>\n<li>CLI \u56de\u9000\uff1a<code>whisper-cli<\/code>\uff08whisper-cpp\uff09\u6216 <code>whisper<\/code>\u3002<\/li>\n<li>Deepgram \u8bbe\u7f6e\uff1a<a href=\"\/providers\/deepgram\">Deepgram\uff08\u97f3\u9891\u8f6c\u5f55\uff09<\/a>\u3002<\/li>\n<\/ul>\n<p><strong>\u89c6\u9891<\/strong><\/p>\n<ul>\n<li><code>google\/gemini-3-flash-preview<\/code>\uff08\u5feb\u901f\uff09\u3001<code>google\/gemini-3-pro-preview<\/code>\uff08\u66f4\u4e30\u5bcc\uff09\u3002<\/li>\n<li>CLI \u56de\u9000\uff1a<code>gemini<\/code> CLI\uff08\u652f\u6301\u5bf9\u89c6\u9891\/\u97f3\u9891\u4f7f\u7528 
<code>read_file<\/code>\uff09\u3002<\/li>\n<\/ul>\n<h2>\u9644\u4ef6\u7b56\u7565<\/h2>\n<p>\u6bcf\u80fd\u529b\u7684 <code>attachments<\/code> \u63a7\u5236\u5904\u7406\u54ea\u4e9b\u9644\u4ef6\uff1a<\/p>\n<ul>\n<li><code>mode<\/code>\uff1a<code>first<\/code>\uff08\u9ed8\u8ba4\uff09\u6216 <code>all<\/code><\/li>\n<li><code>maxAttachments<\/code>\uff1a\u9650\u5236\u5904\u7406\u6570\u91cf\uff08\u9ed8\u8ba4 <strong>1<\/strong>\uff09<\/li>\n<li><code>prefer<\/code>\uff1a<code>first<\/code>\u3001<code>last<\/code>\u3001<code>path<\/code>\u3001<code>url<\/code><\/li>\n<\/ul>\n<p>\u5f53 <code>mode: \"all\"<\/code> \u65f6\uff0c\u8f93\u51fa\u6807\u8bb0\u4e3a <code>[Image 1\/2]<\/code>\u3001<code>[Audio 2\/2]<\/code> \u7b49\u3002<\/p>\n<h2>\u914d\u7f6e\u793a\u4f8b<\/h2>\n<h3>1) \u5171\u4eab\u6a21\u578b\u5217\u8868 + \u8986\u76d6<\/h3>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      models: [\n        { provider: &quot;openai&quot;, model: &quot;gpt-5.2&quot;, capabilities: [&quot;image&quot;] },\n        {\n          provider: &quot;google&quot;,\n          model: &quot;gemini-3-flash-preview&quot;,\n          capabilities: [&quot;image&quot;, &quot;audio&quot;, &quot;video&quot;],\n        },\n        {\n          type: &quot;cli&quot;,\n          command: &quot;gemini&quot;,\n          args: [\n            &quot;-m&quot;,\n            &quot;gemini-3-flash&quot;,\n            &quot;--allowed-tools&quot;,\n            &quot;read_file&quot;,\n            &quot;Read the media at {{MediaPath}} and describe it in &lt;= {{MaxChars}} characters.&quot;,\n          ],\n          capabilities: [&quot;image&quot;, &quot;video&quot;],\n        },\n      ],\n      audio: {\n        attachments: { mode: &quot;all&quot;, maxAttachments: 2 },\n      },\n      video: {\n        maxChars: 500,\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<h3>2) \u4ec5\u97f3\u9891 + \u89c6\u9891\uff08\u56fe\u7247\u5173\u95ed\uff09<\/h3>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      audio: {\n        enabled: true,\n        models: [\n          { provider: &quot;openai&quot;, model: &quot;gpt-4o-mini-transcribe&quot; },\n          {\n            type: &quot;cli&quot;,\n            command: &quot;whisper&quot;,\n            args: [&quot;--model&quot;, &quot;base&quot;, &quot;{{MediaPath}}&quot;],\n          },\n        ],\n      },\n      video: {\n        enabled: true,\n        maxChars: 500,\n        models: [\n          { provider: &quot;google&quot;, model: &quot;gemini-3-flash-preview&quot; },\n          {\n            type: &quot;cli&quot;,\n            command: &quot;gemini&quot;,\n            args: [\n              &quot;-m&quot;,\n              &quot;gemini-3-flash&quot;,\n              &quot;--allowed-tools&quot;,\n              &quot;read_file&quot;,\n              &quot;Read the media at {{MediaPath}} and describe it in &lt;= {{MaxChars}} characters.&quot;,\n            ],\n          },\n        ],\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<h3>3) \u53ef\u9009\u56fe\u7247\u7406\u89e3<\/h3>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      image: {\n        enabled: true,\n        maxBytes: 10485760,\n        maxChars: 500,\n        models: [\n          { provider: &quot;openai&quot;, model: &quot;gpt-5.2&quot; },\n          { provider: &quot;anthropic&quot;, model: &quot;claude-opus-4-5&quot; },\n          {\n            type: &quot;cli&quot;,\n            command: &quot;gemini&quot;,\n            args: [\n              &quot;-m&quot;,\n              &quot;gemini-3-flash&quot;,\n              &quot;--allowed-tools&quot;,\n              &quot;read_file&quot;,\n              &quot;Read the media at {{MediaPath}} and describe it in &lt;= {{MaxChars}} characters.&quot;,\n            ],\n          },\n        ],\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<h3>4) \u591a\u6a21\u6001\u5355\u6761\u76ee\uff08\u663e\u5f0f\u80fd\u529b\uff09<\/h3>\n<pre><code class=\"language-json5\">{\n  tools: {\n    media: {\n      image: {\n        models: [\n          {\n            provider: &quot;google&quot;,\n            model: &quot;gemini-3-pro-preview&quot;,\n            capabilities: [&quot;image&quot;, &quot;video&quot;, &quot;audio&quot;],\n          },\n        ],\n      },\n      audio: {\n        models: [\n          {\n            provider: &quot;google&quot;,\n            model: &quot;gemini-3-pro-preview&quot;,\n            capabilities: [&quot;image&quot;, &quot;video&quot;, &quot;audio&quot;],\n          },\n        ],\n      },\n      video: {\n        models: [\n          {\n            provider: &quot;google&quot;,\n            model: &quot;gemini-3-pro-preview&quot;,\n            capabilities: [&quot;image&quot;, &quot;video&quot;, &quot;audio&quot;],\n          },\n        ],\n      },\n    },\n  },\n}\n<\/code><\/pre>\n<h2>\u72b6\u6001\u8f93\u51fa<\/h2>\n<p>\u5f53\u5a92\u4f53\u7406\u89e3\u8fd0\u884c\u65f6\uff0c<code>\/status<\/code> \u5305\u542b\u4e00\u884c\u7b80\u77ed\u6458\u8981\uff1a<\/p>\n<pre><code>\ud83d\udcce Media: image ok (openai\/gpt-5.2) \u00b7 audio skipped 
(maxBytes)\n<\/code><\/pre>\n<p>\u8fd9\u663e\u793a\u6bcf\u80fd\u529b\u7684\u7ed3\u679c\u4ee5\u53ca\u9002\u7528\u65f6\u9009\u62e9\u7684\u63d0\u4f9b\u5546\/\u6a21\u578b\u3002<\/p>\n<h2>\u6ce8\u610f\u4e8b\u9879<\/h2>\n<ul>\n<li>\u7406\u89e3\u662f<strong>\u5c3d\u529b\u800c\u4e3a<\/strong>\u7684\u3002\u9519\u8bef\u4e0d\u4f1a\u963b\u6b62\u56de\u590d\u3002<\/li>\n<li>\u5373\u4f7f\u7406\u89e3\u88ab\u7981\u7528\uff0c\u9644\u4ef6\u4ecd\u7136\u4f20\u9012\u7ed9\u6a21\u578b\u3002<\/li>\n<li>\u4f7f\u7528 <code>scope<\/code> \u9650\u5236\u7406\u89e3\u8fd0\u884c\u7684\u4f4d\u7f6e\uff08\u4f8b\u5982\u4ec5\u79c1\u4fe1\uff09\u3002<\/li>\n<\/ul>\n<h2>\u76f8\u5173\u6587\u6863<\/h2>\n<ul>\n<li><a href=\"\/gateway\/configuration\">\u914d\u7f6e<\/a><\/li>\n<li><a href=\"\/nodes\/images\">\u56fe\u7247\u548c\u5a92\u4f53\u652f\u6301<\/a><\/li>\n<\/ul>\n","protected":false},"excerpt":{"rendered":"<p>\u5a92\u4f53\u7406\u89e3 \u5a92\u4f53\u7406\u89e3\uff08\u5165\u7ad9\uff09\u2014 2026-01-17 OpenClaw \u53ef\u4ee5\u5728\u56de\u590d\u6d41\u7a0b\u8fd0\u884c\u4e4b\u524d\u6458\u8981\u5165\u7ad9\u5a92\u4f53\uff08\u56fe\u7247 
[&hellip;]<\/p>\n","protected":false},"author":0,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[2],"tags":[],"class_list":["post-179","post","type-post","status-publish","format-standard","hentry","category-docs"],"_links":{"self":[{"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/posts\/179","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/types\/post"}],"replies":[{"embeddable":true,"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/comments?post=179"}],"version-history":[{"count":1,"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/posts\/179\/revisions"}],"predecessor-version":[{"id":474,"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/posts\/179\/revisions\/474"}],"wp:attachment":[{"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/media?parent=179"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/categories?post=179"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/pa.yingzhi8.cn\/index.php\/wp-json\/wp\/v2\/tags?post=179"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}