[{"data":1,"prerenderedAt":4100},["ShallowReactive",2],{"header-counts":3,"footer-counts":6,"tool-tools\u002Fcoding\u002Fapi\u002Fone-api":9,"tool-stats-coding\u002Fapi\u002Fone-api":776,"cat-rank-coding-api":779,"tool-related-coding\u002Fapi\u002Fone-api":4099},{"tools":4,"reviews":5},65,7,{"tools":4,"reviews":5,"playbooks":7,"news":8},10,8,{"id":10,"title":11,"alternatives":12,"api_compatible":25,"body":26,"category":708,"chinese_friendly":289,"cover":709,"description":710,"domestic":711,"extension":712,"faq":713,"free":711,"github":25,"languages":726,"meta":729,"models":25,"navigation":312,"notSuitable":25,"opensource":312,"path":730,"pillar":731,"platforms":732,"priceTable":735,"pricing":129,"published":746,"relatedPlaybooks":747,"relatedReviews":25,"score":751,"self_host":312,"seo":752,"slug":753,"sources":754,"stem":764,"suitable":25,"tagline":765,"tags":766,"updated":757,"verdict":774,"website":683,"__hash__":775},"tools\u002Ftools\u002Fcoding\u002Fapi\u002Fone-api.md","One-API",[13,16,19,22],{"name":14,"url":15},"litellm","\u002Ftools\u002Fcoding\u002Fapi\u002Flitellm",{"name":17,"url":18},"openrouter","\u002Ftools\u002Fcoding\u002Fapi\u002Fopenrouter",{"name":20,"url":21},"portkey","\u002Ftools\u002Fcoding\u002Fapi\u002Fportkey",{"name":23,"url":24},"helicone","\u002Ftools\u002Fcoding\u002Fapi\u002Fhelicone",null,{"type":27,"value":28,"toc":696},"minimark",[29,34,43,46,49,120,123,137,143,147,152,177,182,208,212,360,363,540,543,598,602,631,634,657,660,692],[30,31,33],"h2",{"id":32},"tldr","TL;DR",[35,36,37,38,42],"p",{},"One-API 是国内最流行的开源 LLM API 网关——JustSong 用 Go 写的 OpenAI 兼容代理，GitHub 18K+ Star，",[39,40,41],"code",{},"docker run"," 一行起一个能用的 AI API 平台。30+ 厂商（海外 + 国内全覆盖）统一 OpenAI 格式，内置中文 UI + Key 管理 + 渠道分组 + 负载均衡 + 额度系统 + 邀请返佣。衍生项目 new-api（QuantumNous）增强多租户、缓存独立计费、内置 EPay \u002F Stripe 支付、Claude \u002F Gemini 原生格式、多种登录方式——已成为商业化中转站的事实底座。",[35,44,45],{},"适合：国内个人 \u002F 小团队自建 LLM 网关 + 多账号轮询；企业内部统一多厂商 API 入口 + 中文运营；学习 LLM 网关架构。不适合：微服务架构 \u002F 多语言客户端（走 
LiteLLM）；不想运维（走 OpenRouter \u002F Portkey）；向中国境内公众提供未备案服务（违法）。",[30,47,48],{"id":48},"核心能力",[50,51,52,60,66,72,78,84,90,96,102,108,114],"ul",{},[53,54,55,59],"li",{},[56,57,58],"strong",{},"30+ 厂商","：OpenAI \u002F Claude \u002F Gemini \u002F Mistral \u002F Groq \u002F xAI；DeepSeek \u002F 通义 \u002F 文心 \u002F 讯飞 \u002F 智谱 \u002F 豆包 \u002F Moonshot \u002F 百川 \u002F MiniMax \u002F 零一万物 \u002F 阶跃星辰；Ollama \u002F Cloudflare Workers AI 等",[53,61,62,65],{},[56,63,64],{},"Key 管理","：生成 \u002F 分发 \u002F 过期 \u002F 额度控制",[53,67,68,71],{},[56,69,70],{},"渠道分组","：批量创建 \u002F 分组 \u002F 模型映射",[53,73,74,77],{},[56,75,76],{},"负载均衡","：多 Key 轮询 + 失败自动重试",[53,79,80,83],{},[56,81,82],{},"额度系统","：用户额度 \u002F 兑换码 \u002F 邀请返佣",[53,85,86,89],{},[56,87,88],{},"日志监控","：请求日志 \u002F 额度明细 \u002F 报警",[53,91,92,95],{},[56,93,94],{},"权限控制","：IP 白名单 \u002F Token 分组 \u002F 模型限制",[53,97,98,101],{},[56,99,100],{},"多输出格式","：OpenAI \u002F Claude \u002F Gemini 原生（new-api）",[53,103,104,107],{},[56,105,106],{},"多登录方式","：邮箱 \u002F GitHub \u002F 飞书；new-api 加 Discord \u002F Telegram \u002F LinuxDO \u002F OIDC",[53,109,110,113],{},[56,111,112],{},"Docker 一键部署","：SQLite（小规模）\u002F MySQL（生产）",[53,115,116,119],{},[56,117,118],{},"多语言 UI","：中文 \u002F 英文 \u002F 日文",[30,121,122],{"id":122},"价格",[50,124,125,131,134],{},[53,126,127,130],{},[56,128,129],{},"MIT 开源免费","，自托管成本 = 1 台 VPS（最小 1 核 1G 跑 SQLite 版）",[53,132,133],{},"上游模型成本走各厂商直接结算",[53,135,136],{},"new-api 内置 EPay \u002F Stripe 支付，可对接支付宝当面付 \u002F 微信支付（自行二开）",[138,139,140],"blockquote",{},[35,141,142],{},"部署起步：阿里云 \u002F 腾讯云轻量 1 核 1G 月 ¥30，配 Cloudflare CDN 全套月不到 ¥50。",[30,144,146],{"id":145},"实测5-人创业团队-内部统一-api-入口","实测（5 人创业团队 + 内部统一 API 入口）",[35,148,149],{},[56,150,151],{},"亮点：",[50,153,154,159,162,165,168,171,174],{},[53,155,156,158],{},[39,157,41],{}," 一行 5 分钟拉起 + 中文 UI 上手 0 摩擦",[53,160,161],{},"多 Key 轮询解决 OpenAI \u002F Anthropic 单 Key 限流",[53,163,164],{},"国内模型全 + 统一 OpenAI 接口，业务代码 0 修改切换",[53,166,167],{},"额度系统给每人发 token，成本归因清晰",[53,169,170],{},"new-api 仪表盘 + 
缓存计费让 prompt caching 优化看得见",[53,172,173],{},"new-api 内置 EPay 支付对 B2B 中转站很方便",[53,175,176],{},"二次开发简单：Go 单仓 + 前端 React，加渠道 \u002F 改 logo 都不难",[35,178,179],{},[56,180,181],{},"踩坑：",[50,183,184,187,190,193,196,199,202,205],{},[53,185,186],{},"默认账号 root \u002F 123456 不改是大坑，公网暴露 = 资产被滥用",[53,188,189],{},"SQLite 版只适合个人 \u002F \u003C10 用户，团队 \u002F 生产必须 MySQL",[53,191,192],{},"文档以中文 README 为主，国际化弱",[53,194,195],{},"原版 one-api 缺多租户 + 缓存计费 + 仪表盘，生产几乎都得切 new-api",[53,197,198],{},"上游模型轮询时单点失败重试策略不如 LiteLLM 三类 fallback 细",[53,200,201],{},"高并发场景需要 Redis 配合做限流",[53,203,204],{},"部分上游厂商接口变更后需手动跟进升级",[53,206,207],{},"合规：未备案对外服务面临监管风险，企业内部用没问题",[30,209,211],{"id":210},"上手new-api-推荐","上手（new-api 推荐）",[213,214,219],"pre",{"className":215,"code":216,"language":217,"meta":218,"style":218},"language-bash shiki shiki-themes github-light github-dark","# MySQL 生产版\ndocker run --name new-api -d --restart always -p 3000:3000 \\\n  -e SQL_DSN=\"root:pass@tcp(host:3306)\u002Fnewapi\" \\\n  -e TZ=Asia\u002FShanghai \\\n  -v $PWD\u002Fdata:\u002Fdata \\\n  calciumion\u002Fnew-api:latest\n\n# 访问 http:\u002F\u002Flocalhost:3000\n# 1. 改 root 密码 + 关注册 + 加 IP 白名单\n# 2. 渠道管理 → 添加上游（OpenAI \u002F Anthropic \u002F DeepSeek Key）\n# 3. 设模型映射 + 倍率\n# 4. 用户管理 → 生成 token 给业务方\n# 5. 
业务方调用：\n#    baseURL = https:\u002F\u002Fyour-domain\u002Fv1\n#    api_key = sk-xxx-from-newapi\n","bash","",[39,220,221,230,266,277,287,302,308,314,319,325,330,336,342,348,354],{"__ignoreMap":218},[222,223,226],"span",{"class":224,"line":225},"line",1,[222,227,229],{"class":228},"sJ8bj","# MySQL 生产版\n",[222,231,233,237,241,245,248,251,254,257,260,263],{"class":224,"line":232},2,[222,234,236],{"class":235},"sScJk","docker",[222,238,240],{"class":239},"sZZnC"," run",[222,242,244],{"class":243},"sj4cs"," --name",[222,246,247],{"class":239}," new-api",[222,249,250],{"class":243}," -d",[222,252,253],{"class":243}," --restart",[222,255,256],{"class":239}," always",[222,258,259],{"class":243}," -p",[222,261,262],{"class":239}," 3000:3000",[222,264,265],{"class":243}," \\\n",[222,267,269,272,275],{"class":224,"line":268},3,[222,270,271],{"class":243},"  -e",[222,273,274],{"class":239}," SQL_DSN=\"root:pass@tcp(host:3306)\u002Fnewapi\"",[222,276,265],{"class":243},[222,278,280,282,285],{"class":224,"line":279},4,[222,281,271],{"class":243},[222,283,284],{"class":239}," TZ=Asia\u002FShanghai",[222,286,265],{"class":243},[222,288,290,293,297,300],{"class":224,"line":289},5,[222,291,292],{"class":243},"  -v",[222,294,296],{"class":295},"sVt8B"," $PWD",[222,298,299],{"class":239},"\u002Fdata:\u002Fdata",[222,301,265],{"class":243},[222,303,305],{"class":224,"line":304},6,[222,306,307],{"class":239},"  calciumion\u002Fnew-api:latest\n",[222,309,310],{"class":224,"line":5},[222,311,313],{"emptyLinePlaceholder":312},true,"\n",[222,315,316],{"class":224,"line":8},[222,317,318],{"class":228},"# 访问 http:\u002F\u002Flocalhost:3000\n",[222,320,322],{"class":224,"line":321},9,[222,323,324],{"class":228},"# 1. 改 root 密码 + 关注册 + 加 IP 白名单\n",[222,326,327],{"class":224,"line":7},[222,328,329],{"class":228},"# 2. 渠道管理 → 添加上游（OpenAI \u002F Anthropic \u002F DeepSeek Key）\n",[222,331,333],{"class":224,"line":332},11,[222,334,335],{"class":228},"# 3. 
设模型映射 + 倍率\n",[222,337,339],{"class":224,"line":338},12,[222,340,341],{"class":228},"# 4. 用户管理 → 生成 token 给业务方\n",[222,343,345],{"class":224,"line":344},13,[222,346,347],{"class":228},"# 5. 业务方调用：\n",[222,349,351],{"class":224,"line":350},14,[222,352,353],{"class":228},"#    baseURL = https:\u002F\u002Fyour-domain\u002Fv1\n",[222,355,357],{"class":224,"line":356},15,[222,358,359],{"class":228},"#    api_key = sk-xxx-from-newapi\n",[30,361,362],{"id":362},"对比",[364,365,366,387],"table",{},[367,368,369],"thead",{},[370,371,372,376,378,381,384],"tr",{},[373,374,375],"th",{},"维度",[373,377,11],{},[373,379,380],{},"new-api",[373,382,383],{},"LiteLLM",[373,385,386],{},"OpenRouter",[388,389,390,407,423,436,451,465,479,495,509,525],"tbody",{},[370,391,392,396,399,401,404],{},[393,394,395],"td",{},"语言",[393,397,398],{},"Go",[393,400,398],{},[393,402,403],{},"Python",[393,405,406],{},"–",[370,408,409,412,415,418,421],{},[393,410,411],{},"多租户",[393,413,414],{},"❌",[393,416,417],{},"✅",[393,419,420],{},"✅ (Enterprise)",[393,422,414],{},[370,424,425,428,430,432,434],{},[393,426,427],{},"缓存独立计费",[393,429,414],{},[393,431,417],{},[393,433,406],{},[393,435,406],{},[370,437,438,441,443,446,448],{},[393,439,440],{},"内置支付",[393,442,414],{},[393,444,445],{},"EPay \u002F Stripe",[393,447,414],{},[393,449,450],{},"❌（卡 + USDC）",[370,452,453,456,459,461,463],{},[393,454,455],{},"中文支付二开",[393,457,458],{},"✅ 易",[393,460,458],{},[393,462,406],{},[393,464,406],{},[370,466,467,470,472,474,477],{},[393,468,469],{},"中文 UI",[393,471,417],{},[393,473,417],{},[393,475,476],{},"英文",[393,478,476],{},[370,480,481,484,487,489,492],{},[393,482,483],{},"国内模型覆盖",[393,485,486],{},"✅ 全",[393,488,486],{},[393,490,491],{},"部分",[393,493,494],{},"中等",[370,496,497,500,502,504,506],{},[393,498,499],{},"Claude 原生格式",[393,501,414],{},[393,503,417],{},[393,505,417],{},[393,507,508],{},"OpenAI 兼容",[370,510,511,514,517,520,523],{},[393,512,513],{},"GitHub 
Star",[393,515,516],{},"18K+",[393,518,519],{},"增长快",[393,521,522],{},"高",[393,524,406],{},[370,526,527,530,533,535,538],{},[393,528,529],{},"部署难度",[393,531,532],{},"⭐",[393,534,532],{},[393,536,537],{},"⭐⭐",[393,539,406],{},[30,541,542],{"id":542},"避坑",[50,544,545,550,556,562,568,574,580,586,592],{},[53,546,547],{},[56,548,549],{},"第一件事改 root 密码 + 关公开注册 + 加 IP 白名单",[53,551,552,555],{},[56,553,554],{},"生产用 MySQL 不要 SQLite","：SQLite 并发上千就吃力",[53,557,558,561],{},[56,559,560],{},"加 Cloudflare CDN + WAF","：上游厂商风控会按出口 IP，扛不住会被拉黑",[53,563,564,567],{},[56,565,566],{},"渠道倍率别贪 0.1","：太低用户烧得快 + 上游被你做穿",[53,569,570,573],{},[56,571,572],{},"充值流水必须留痕","：EPay \u002F 自二开支付要符合发票 \u002F 反洗钱要求",[53,575,576,579],{},[56,577,578],{},"算法备案","：对中国境内公众提供生成式 AI 服务必须备案，否则违法",[53,581,582,585],{},[56,583,584],{},"上游条款","：OpenAI \u002F Anthropic \u002F 国内厂商基本都禁止未授权转售 API，自用 OK，商业化要拿合作授权",[53,587,588,591],{},[56,589,590],{},"缓存计费 (new-api)","：开 prompt caching 后单价不同，账单要看明细",[53,593,594,597],{},[56,595,596],{},"国内访问外网模型","：服务器要部署在能直连厂商的节点（如香港 \u002F 美西）+ 反向代理给国内用户",[30,599,601],{"id":600},"适合-不适合","适合 \u002F 不适合",[50,603,604,607,610,613,616,619,622,625,628],{},[53,605,606],{},"✅ 国内个人 \u002F 小团队自建 LLM 网关",[53,608,609],{},"✅ 企业内部统一多厂商 API 入口",[53,611,612],{},"✅ 学习 LLM 网关架构 \u002F 二次开发",[53,614,615],{},"✅ 国内模型 + 海外模型混用",[53,617,618],{},"✅ 中文运营 + 国内支付",[53,620,621],{},"❌ 微服务 \u002F 多语言客户端（走 LiteLLM）",[53,623,624],{},"❌ 不想运维（走 OpenRouter \u002F Portkey）",[53,626,627],{},"❌ 向中国境内公众提供未备案服务（违法）",[53,629,630],{},"❌ 国际化产品 \u002F 多语言文档需求",[30,632,633],{"id":633},"相关阅读",[50,635,636,642,647,652],{},[53,637,638],{},[639,640,641],"a",{"href":15},"LiteLLM 评测",[53,643,644],{},[639,645,646],{"href":18},"OpenRouter 评测",[53,648,649],{},[639,650,651],{"href":21},"Portkey 评测",[53,653,654],{},[639,655,656],{"href":24},"Helicone 评测",[30,658,659],{"id":659},"来源",[661,662,663,671,678,685],"ol",{},[53,664,665,666],{},"CSDN — One-API vs New-API 2026 选型与部署踩坑 
",[639,667,668],{"href":668,"rel":669},"https:\u002F\u002Fblog.csdn.net\u002Fofoxcoding\u002Farticle\u002Fdetails\u002F158886435",[670],"nofollow",[53,672,673,674],{},"DeepSeek 社区 — 2026 LLM API 中转站技术全景（含 new-api 增强能力对比表）",[639,675,676],{"href":676,"rel":677},"https:\u002F\u002Fdevpress.csdn.net\u002Fv1\u002Farticle\u002Fdetail\u002F161060038",[670],[53,679,680,681],{},"GitHub — songquanpeng\u002Fone-api ",[639,682,683],{"href":683,"rel":684},"https:\u002F\u002Fgithub.com\u002Fsongquanpeng\u002Fone-api",[670],[53,686,687,688],{},"GitHub — QuantumNous\u002Fnew-api ",[639,689,690],{"href":690,"rel":691},"https:\u002F\u002Fgithub.com\u002FQuantumNous\u002Fnew-api",[670],[693,694,695],"style",{},"html pre.shiki code .sJ8bj, html code.shiki .sJ8bj{--shiki-default:#6A737D;--shiki-dark:#6A737D}html pre.shiki code .sScJk, html code.shiki .sScJk{--shiki-default:#6F42C1;--shiki-dark:#B392F0}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: 
var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":218,"searchDepth":268,"depth":268,"links":697},[698,699,700,701,702,703,704,705,706,707],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":145,"depth":232,"text":146},{"id":210,"depth":232,"text":211},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},"api","\u002Fimg\u002Ftools\u002Fone-api.webp","One-API 真实评测：JustSong 维护的开源 LLM API 网关（GitHub 18K+ Star，Go 语言）。把 30+ 海内外厂商 API 统一成 OpenAI 格式，内置中文 UI + Key 管理 + 渠道分组 + 负载均衡 + 额度兑换 + IP 白名单 + 邀请返佣。`docker run` 一行起。衍生 new-api 增强多租户 \u002F 缓存计费 \u002F 内置 EPay 支付。",false,"md",[714,717,720,723],{"q":715,"a":716},"One-API 和 new-api 怎么选？","个人 \u002F 小团队内部用：one-api 已够。要做面向 B2B \u002F 商业化 \u002F 中文支付：new-api 多租户 + EPay\u002FStripe + 缓存独立计费 + 仪表盘更专业。new-api 是 one-api 二次开发版本，在生产场景已经全面超越原版。",{"q":718,"a":719},"支持哪些模型？","海外：OpenAI \u002F Anthropic Claude \u002F Google Gemini \u002F Mistral \u002F Groq \u002F Cohere \u002F xAI。国内：DeepSeek \u002F 通义千问 \u002F 文心一言 \u002F 讯飞星火 \u002F ChatGLM \u002F 豆包 \u002F 腾讯混元 \u002F 360 智脑 \u002F Moonshot \u002F 百川 \u002F MiniMax \u002F 零一万物 \u002F 阶跃星辰。本地：Ollama \u002F Cloudflare Workers AI。",{"q":721,"a":722},"默认密码记得改","Docker 拉起后默认账号 root \u002F 密码 123456。官方 README 已经反复警告但大量公开暴露的中转站连这一步都没做——上线前第一件事改密码 + 关注册 + 加 IP 白名单。",{"q":724,"a":725},"搭建中转站合规吗？","one-api \u002F new-api 本身是中立技术工具，合法场景：(1) 企业内部统一管理多厂商 API；(2) 个人学习研究；(3) 与上游签订正式合作的 B2B 服务。向中国境内公众提供生成式 AI 服务，依据《生成式人工智能服务管理暂行办法》必须完成算法备案 + 内容安全责任 + 投诉举报机制。未授权代理 \u002F 转售 OpenAI \u002F Anthropic API 违反上游条款。",[727,728],"zh","en",{},"\u002Ftools\u002Fcoding\u002Fapi\u002Fone-api","coding",[236,733,734],"linux","windows",[736,741],{"plan":737,"price":738,"features":739,"notes":740},"one-api（原版）","$0（MIT）","30+ 厂商统一 OpenAI 格式 + Key 管理 + 渠道分组 + 负载均衡 + 额度系统 + 多语言 
UI","songquanpeng\u002Fone-api",{"plan":742,"price":743,"features":744,"notes":745},"new-api（增强版）","$0","原版 + 多租户 + 缓存计费 + 内置 EPay\u002FStripe + Discord\u002FTelegram\u002FLinuxDO 登录 + Claude\u002FGemini 原生格式","QuantumNous\u002Fnew-api","2026-06-19",[748],{"name":749,"url":750},"Claude Code 上手","\u002Fplaybook\u002Fonboarding\u002Fclaude-code-getting-started",{"power":279,"ux":279,"price":289,"cn_support":289,"stability":279},{"title":11,"description":710},"coding\u002Fapi\u002Fone-api",[755,758,760,762],{"name":756,"url":668,"accessed":757},"CSDN — One-API vs New-API 2026 选型与踩坑","2026-06-24",{"name":759,"url":676,"accessed":757},"DeepSeek 社区 — 2026 LLM API 中转站技术全景",{"name":761,"url":683,"accessed":757},"GitHub — songquanpeng\u002Fone-api",{"name":763,"url":690,"accessed":757},"GitHub — QuantumNous\u002Fnew-api","tools\u002Fcoding\u002Fapi\u002Fone-api","国内最流行的开源 LLM 网关——Go + Docker 一键起，30+ 厂商统一 OpenAI 格式，中文 UI + 充值系统",[767,768,769,770,771,772,773],"llm-gateway","opensource","mit","chinese","go","openai-compatible","self-host","国内开发者自建 LLM 网关首选——中文 UI + 国内模型全 + EPay 支付。海外团队 \u002F 多语言客户端 \u002F 微服务架构走 
LiteLLM；面向中国境内公众提供服务需依法备案。","_7HhOvUdakEn-dUR9ynTfAieeAqkfQZ7pnT8O55Rn9Q",{"ok":312,"slug":777,"viewCount":778,"clickCount":778,"avgRating":778,"ratingCount":778},"coding%2Fapi%2Fone-api",0,[780,1541,2278,2783,3306],{"id":781,"title":782,"alternatives":783,"api_compatible":25,"body":789,"category":708,"chinese_friendly":232,"cover":1474,"description":1475,"domestic":711,"extension":712,"faq":1476,"free":711,"github":25,"languages":1489,"meta":1490,"models":25,"navigation":312,"notSuitable":25,"opensource":312,"path":24,"pillar":731,"platforms":1491,"priceTable":1494,"pricing":1510,"published":746,"relatedPlaybooks":1511,"relatedReviews":25,"score":1515,"self_host":312,"seo":1516,"slug":1517,"sources":1518,"stem":1529,"suitable":25,"tagline":1530,"tags":1531,"updated":757,"verdict":1538,"website":1539,"__hash__":1540},"tools\u002Ftools\u002Fcoding\u002Fapi\u002Fhelicone.md","Helicone",[784,785,786,787],{"name":20,"url":21},{"name":14,"url":15},{"name":17,"url":18},{"name":788,"url":730},"one-api",{"type":27,"value":790,"toc":1462},[791,793,796,799,801,879,881,907,912,916,920,943,947,973,976,1103,1146,1148,1316,1318,1368,1370,1399,1401,1420,1422,1459],[30,792,33],{"id":32},[35,794,795],{},"Helicone 是 YC W23 出身的开源 LLM 观测平台，主打『一行代码接入』：改 baseURL，立刻看到 cost \u002F latency \u002F errors \u002F token 详情。背后还有 Rust 写的 AI Gateway，路由 100+ 模型 + 缓存 + fallback + 限流。2026-03-03 被 Mintlify 收购后转维护模式（安全 patch + 新模型 + bug fix 继续，主动新功能停）。Hobby 免费 10K req\u002F月，Pro $79，Team $799（SOC2 + HIPAA），Enterprise 定制。SOC2 + GDPR 合规，可 Docker \u002F Kubernetes 自托管。",[35,797,798],{},"适合：要 5 分钟接入 LLM 观测的小团队 \u002F 早期产品；改 baseURL 模式想看 cost \u002F latency 即可；预算紧 → Hobby 10K 免费 + 自托管 OSS。不适合：复杂 agent 调试需要 nested span（Langfuse）；要 250+ 模型 \u002F MCP Gateway \u002F 治理（Portkey）；担心维护模式带来的路线图风险（Mintlify 收购后主动开发结束）。",[30,800,48],{"id":48},[50,802,803,809,815,821,827,832,838,844,849,855,861,867,873],{},[53,804,805,808],{},[56,806,807],{},"Proxy 模式","：改 baseURL，零 SDK 改造",[53,810,811,814],{},[56,812,813],{},"Async 
模式","：SDK 异步上报，0 延迟 + 容错",[53,816,817,820],{},[56,818,819],{},"Request logging","：每条请求 + 响应 + cost + token + latency",[53,822,823,826],{},[56,824,825],{},"Custom properties + sessions","：把多步工作流分组看",[53,828,829],{},[56,830,831],{},"Prompt management + playground",[53,833,834,837],{},[56,835,836],{},"Custom scoring","：基础打分 + 数据集",[53,839,840,843],{},[56,841,842],{},"AI Gateway","（Rust 写）：100+ 模型 + caching + fallback + rate limit",[53,845,846],{},[56,847,848],{},"OpenAI \u002F Anthropic \u002F Azure \u002F LiteLLM \u002F Anyscale \u002F Together \u002F OpenRouter 集成",[53,850,851,854],{},[56,852,853],{},"Trace API","：手动 POST 多步 trace 数据（弥补 proxy 看不到 agent 内部）",[53,856,857,860],{},[56,858,859],{},"Dashboard API","：查 dashboard 数据",[53,862,863,866],{},[56,864,865],{},"Self-host","：Docker \u002F Kubernetes，开源 MIT",[53,868,869,872],{},[56,870,871],{},"合规","：SOC 2 + GDPR；Team+ HIPAA",[53,874,875,878],{},[56,876,877],{},"导出","：webhook + 外部 reporting",[30,880,122],{"id":122},[50,882,883,889,895,901],{},[53,884,885,888],{},[56,886,887],{},"Hobby","：$0 \u002F 10K req\u002F月 \u002F 7 天 retention \u002F 1 seat \u002F 1GB 存储",[53,890,891,894],{},[56,892,893],{},"Pro","：$79\u002F月 \u002F 10K 起 + usage \u002F 1 月 retention \u002F unlimited seats \u002F alerts \u002F HQL",[53,896,897,900],{},[56,898,899],{},"Team","：$799\u002F月 \u002F 10K 起 + usage \u002F 3 月 retention \u002F SOC 2 + HIPAA \u002F 5 orgs",[53,902,903,906],{},[56,904,905],{},"Enterprise","：Custom \u002F 自定义 retention \u002F 永久存储 \u002F SSO \u002F on-prem",[138,908,909],{},[35,910,911],{},"自托管版（OSS）= $0 + 无限 logs，但运维 \u002F Postgres \u002F Clickhouse 全要自己搞。",[30,913,915],{"id":914},"实测早期-saas-5-人团队","实测（早期 SaaS \u002F 5 人团队）",[35,917,918],{},[56,919,151],{},[50,921,922,925,928,931,934,937,940],{},[53,923,924],{},"5 分钟接入，OpenAI SDK 改 baseURL + 加 Helicone-Auth header",[53,926,927],{},"Dashboard 看 cost \u002F latency \u002F error 第一天就帮发现 prompt 失控",[53,929,930],{},"Custom properties 给每个 user \u002F feature 
打标，分摊成本清晰",[53,932,933],{},"Sessions 把 multi-step workflow 串起来（不像 Langfuse 是真 trace，但够小项目用）",[53,935,936],{},"AI Gateway 给 fallback \u002F caching 一站式提供",[53,938,939],{},"开源自托管对预算紧团队是真救命",[53,941,942],{},"与 LiteLLM 集成顺滑",[35,944,945],{},[56,946,181],{},[50,948,949,952,955,958,961,964,967,970],{},[53,950,951],{},"2026-03 被 Mintlify 收购转维护模式后，主动功能开发停，长期路线图不确定",[53,953,954],{},"Proxy 模式 5–20ms 延迟在高 QPS 场景叠加可观",[53,956,957],{},"Proxy 看不到 agent 内部 tool \u002F sub-agent \u002F retries——复杂 agent 调试不够",[53,959,960],{},"Custom scoring 浅，不如 Langfuse 的 LLM-as-judge + 数据集 eval 体系完整",[53,962,963],{},"Free tier 10K req 小型生产几天就用完",[53,965,966],{},"文档自 Mintlify 收购后部分整合到 Mintlify Docs，导航变化",[53,968,969],{},"中文场景体验有限",[53,971,972],{},"Prompt caching 需要 cache-aware prompt design（含 timestamp \u002F nonce 命中率为 0）",[30,974,975],{"id":975},"上手",[213,977,981],{"className":978,"code":979,"language":980,"meta":218,"style":218},"language-python shiki shiki-themes github-light github-dark","# Proxy 模式\nimport openai\nclient = openai.OpenAI(\n    base_url=\"https:\u002F\u002Foai.helicone.ai\u002Fv1\",\n    api_key=OPENAI_KEY,\n    default_headers={\n        \"Helicone-Auth\": f\"Bearer {HELICONE_KEY}\",\n        \"Helicone-User-Id\": \"user_123\",\n        \"Helicone-Property-Feature\": \"summarize\"\n    }\n)\n# 立刻在 https:\u002F\u002Fus.helicone.ai 看到 cost \u002F latency \u002F log\n","python",[39,982,983,988,997,1008,1022,1034,1044,1066,1078,1088,1093,1098],{"__ignoreMap":218},[222,984,985],{"class":224,"line":225},[222,986,987],{"class":228},"# Proxy 模式\n",[222,989,990,994],{"class":224,"line":232},[222,991,993],{"class":992},"szBVR","import",[222,995,996],{"class":295}," openai\n",[222,998,999,1002,1005],{"class":224,"line":268},[222,1000,1001],{"class":295},"client ",[222,1003,1004],{"class":992},"=",[222,1006,1007],{"class":295}," openai.OpenAI(\n",[222,1009,1010,1014,1016,1019],{"class":224,"line":279},[222,1011,1013],{"class":1012},"s4XuR","    
base_url",[222,1015,1004],{"class":992},[222,1017,1018],{"class":239},"\"https:\u002F\u002Foai.helicone.ai\u002Fv1\"",[222,1020,1021],{"class":295},",\n",[222,1023,1024,1027,1029,1032],{"class":224,"line":289},[222,1025,1026],{"class":1012},"    api_key",[222,1028,1004],{"class":992},[222,1030,1031],{"class":243},"OPENAI_KEY",[222,1033,1021],{"class":295},[222,1035,1036,1039,1041],{"class":224,"line":304},[222,1037,1038],{"class":1012},"    default_headers",[222,1040,1004],{"class":992},[222,1042,1043],{"class":295},"{\n",[222,1045,1046,1049,1052,1055,1058,1061,1064],{"class":224,"line":5},[222,1047,1048],{"class":239},"        \"Helicone-Auth\"",[222,1050,1051],{"class":295},": ",[222,1053,1054],{"class":992},"f",[222,1056,1057],{"class":239},"\"Bearer ",[222,1059,1060],{"class":243},"{HELICONE_KEY}",[222,1062,1063],{"class":239},"\"",[222,1065,1021],{"class":295},[222,1067,1068,1071,1073,1076],{"class":224,"line":8},[222,1069,1070],{"class":239},"        \"Helicone-User-Id\"",[222,1072,1051],{"class":295},[222,1074,1075],{"class":239},"\"user_123\"",[222,1077,1021],{"class":295},[222,1079,1080,1083,1085],{"class":224,"line":321},[222,1081,1082],{"class":239},"        \"Helicone-Property-Feature\"",[222,1084,1051],{"class":295},[222,1086,1087],{"class":239},"\"summarize\"\n",[222,1089,1090],{"class":224,"line":7},[222,1091,1092],{"class":295},"    }\n",[222,1094,1095],{"class":224,"line":332},[222,1096,1097],{"class":295},")\n",[222,1099,1100],{"class":224,"line":338},[222,1101,1102],{"class":228},"# 立刻在 https:\u002F\u002Fus.helicone.ai 看到 cost \u002F latency \u002F log\n",[213,1104,1106],{"className":215,"code":1105,"language":217,"meta":218,"style":218},"# 自托管\ngit clone https:\u002F\u002Fgithub.com\u002FHelicone\u002Fhelicone\ncd helicone && docker compose up -d\n",[39,1107,1108,1113,1124],{"__ignoreMap":218},[222,1109,1110],{"class":224,"line":225},[222,1111,1112],{"class":228},"# 
自托管\n",[222,1114,1115,1118,1121],{"class":224,"line":232},[222,1116,1117],{"class":235},"git",[222,1119,1120],{"class":239}," clone",[222,1122,1123],{"class":239}," https:\u002F\u002Fgithub.com\u002FHelicone\u002Fhelicone\n",[222,1125,1126,1129,1132,1135,1137,1140,1143],{"class":224,"line":268},[222,1127,1128],{"class":243},"cd",[222,1130,1131],{"class":239}," helicone",[222,1133,1134],{"class":295}," && ",[222,1136,236],{"class":235},[222,1138,1139],{"class":239}," compose",[222,1141,1142],{"class":239}," up",[222,1144,1145],{"class":243}," -d\n",[30,1147,362],{"id":362},[364,1149,1150,1164],{},[367,1151,1152],{},[370,1153,1154,1156,1158,1161],{},[373,1155,375],{},[373,1157,782],{},[373,1159,1160],{},"Langfuse",[373,1162,1163],{},"Portkey",[388,1165,1166,1180,1193,1207,1220,1234,1248,1261,1274,1288,1302],{},[370,1167,1168,1171,1174,1177],{},[393,1169,1170],{},"架构",[393,1172,1173],{},"Proxy \u002F Async",[393,1175,1176],{},"SDK",[393,1178,1179],{},"Gateway",[370,1181,1182,1185,1188,1191],{},[393,1183,1184],{},"接入时间",[393,1186,1187],{},"分钟（改 URL）",[393,1189,1190],{},"小时（代码改造）",[393,1192,1187],{},[370,1194,1195,1198,1201,1204],{},[393,1196,1197],{},"Tracing 深度",[393,1199,1200],{},"浅（请求级）",[393,1202,1203],{},"✅ 深 nested",[393,1205,1206],{},"中",[370,1208,1209,1212,1215,1217],{},[393,1210,1211],{},"Multi-provider routing",[393,1213,1214],{},"✅ 基础 fallback",[393,1216,414],{},[393,1218,1219],{},"✅ 250+",[370,1221,1222,1225,1228,1231],{},[393,1223,1224],{},"Prompt mgmt",[393,1226,1227],{},"playground + 基础版本",[393,1229,1230],{},"✅ 版本 + playground",[393,1232,1233],{},"模板 + 管理",[370,1235,1236,1239,1242,1245],{},[393,1237,1238],{},"Eval",[393,1240,1241],{},"基础 scoring",[393,1243,1244],{},"✅ LLM-as-judge + datasets",[393,1246,1247],{},"基础",[370,1249,1250,1252,1255,1258],{},[393,1251,865],{},[393,1253,1254],{},"✅ OSS 完整",[393,1256,1257],{},"✅ MIT 19K+ stars",[393,1259,1260],{},"OSS Gateway only",[370,1262,1263,1265,1268,1271],{},[393,1264,871],{},[393,1266,1267],{},"SOC2 + HIPAA 
(Team+)",[393,1269,1270],{},"SOC2 (Enterprise)",[393,1272,1273],{},"SOC2 + HIPAA + ISO27001",[370,1275,1276,1279,1282,1285],{},[393,1277,1278],{},"Free tier",[393,1280,1281],{},"10K req\u002F月",[393,1283,1284],{},"50K events\u002F月",[393,1286,1287],{},"10K logs\u002F月",[370,1289,1290,1293,1296,1299],{},[393,1291,1292],{},"Paid 起价",[393,1294,1295],{},"$79",[393,1297,1298],{},"$29",[393,1300,1301],{},"$49",[370,1303,1304,1307,1310,1313],{},[393,1305,1306],{},"路线图",[393,1308,1309],{},"⚠️ 维护模式",[393,1311,1312],{},"✅ 活跃",[393,1314,1315],{},"✅ 活跃（PANW 收购）",[30,1317,542],{"id":542},[50,1319,1320,1326,1332,1338,1344,1350,1356,1362],{},[53,1321,1322,1325],{},[56,1323,1324],{},"维护模式风险","：被 Mintlify 收购后主动开发停，新项目长期演进考虑 Langfuse \u002F Portkey",[53,1327,1328,1331],{},[56,1329,1330],{},"Proxy 延迟 + SPOF","：Helicone 挂了，业务也挂；敏感链路用 async",[53,1333,1334,1337],{},[56,1335,1336],{},"Proxy 看不到 agent 内部","：tool call \u002F sub-agent \u002F retries 不可见，复杂 agent 用 Trace API 或转 Langfuse",[53,1339,1340,1343],{},[56,1341,1342],{},"Hobby 10K 跑不久","：小型生产几天用完，预算够直接上 Pro",[53,1345,1346,1349],{},[56,1347,1348],{},"Cache-aware prompt 设计","：prompt 含 timestamp \u002F random nonce 命中率 = 0",[53,1351,1352,1355],{},[56,1353,1354],{},"Custom scoring 浅","：复杂 eval 用 Langfuse 数据集 + LLM-as-judge",[53,1357,1358,1361],{},[56,1359,1360],{},"Air-gapped 价格","：自托管时部分模型价格表要手动维护",[53,1363,1364,1367],{},[56,1365,1366],{},"PII 路径敏感","：所有 prompt 经过 Helicone，要 review PII 处理 + retention + 自托管选项",[30,1369,601],{"id":600},[50,1371,1372,1375,1378,1381,1384,1387,1390,1393,1396],{},[53,1373,1374],{},"✅ 早期产品 + 想 5 分钟接入观测",[53,1376,1377],{},"✅ 改 baseURL 模式偏好 \u002F 不想 SDK 改造",[53,1379,1380],{},"✅ 预算紧 + 自托管接受",[53,1382,1383],{},"✅ 想用 Rust AI Gateway 做 fallback + caching",[53,1385,1386],{},"✅ SOC2 \u002F HIPAA Team+ 合规",[53,1388,1389],{},"❌ 复杂 agent 多步骤调试（用 Langfuse）",[53,1391,1392],{},"❌ 要 250+ 模型 + MCP + 强治理（用 Portkey）",[53,1394,1395],{},"❌ 长期路线图敏感（维护模式 risk）",[53,1397,1398],{},"❌ 中文运营（社区 \u002F 文档 \u002F UI 
均英文）",[30,1400,633],{"id":633},[50,1402,1403,1407,1411,1415],{},[53,1404,1405],{},[639,1406,651],{"href":21},[53,1408,1409],{},[639,1410,641],{"href":15},[53,1412,1413],{},[639,1414,646],{"href":18},[53,1416,1417],{},[639,1418,1419],{"href":730},"One-API 评测",[30,1421,659],{"id":659},[661,1423,1424,1431,1438,1445,1452],{},[53,1425,1426,1427],{},"Inference.net — Helicone Pricing & Alternatives 2026（含 Mintlify 收购 + 维护模式细节）",[639,1428,1429],{"href":1429,"rel":1430},"https:\u002F\u002Finference.net\u002Fcontent\u002Fhelicone-pricing-alternatives",[670],[53,1432,1433,1434],{},"Helicone 官网 ",[639,1435,1436],{"href":1436,"rel":1437},"https:\u002F\u002Fwww.helicone.ai\u002F",[670],[53,1439,1440,1441],{},"QASkills — Helicone LLM Monitoring Complete Guide 2026 ",[639,1442,1443],{"href":1443,"rel":1444},"https:\u002F\u002Fqaskills.sh\u002Fblog\u002Fhelicone-llm-monitoring-complete-guide",[670],[53,1446,1447,1448],{},"AiPedia — Helicone Features Pricing & Failure Modes ",[639,1449,1450],{"href":1450,"rel":1451},"https:\u002F\u002Fwww.aipedia.wiki\u002Ftools\u002Fhelicone\u002F",[670],[53,1453,1454,1455],{},"BuildMVPFast — Langfuse vs Helicone vs Portkey ",[639,1456,1457],{"href":1457,"rel":1458},"https:\u002F\u002Fwww.buildmvpfast.com\u002Fblog\u002Fllm-observability-stack-langfuse-helicone-portkey-2026",[670],[693,1460,1461],{},"html pre.shiki code .sJ8bj, html code.shiki .sJ8bj{--shiki-default:#6A737D;--shiki-dark:#6A737D}html pre.shiki code .sScJk, html code.shiki .sScJk{--shiki-default:#6F42C1;--shiki-dark:#B392F0}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: 
var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html pre.shiki code .szBVR, html code.shiki .szBVR{--shiki-default:#D73A49;--shiki-dark:#F97583}html pre.shiki code .s4XuR, html code.shiki .s4XuR{--shiki-default:#E36209;--shiki-dark:#FFAB70}",{"title":218,"searchDepth":268,"depth":268,"links":1463},[1464,1465,1466,1467,1468,1469,1470,1471,1472,1473],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":914,"depth":232,"text":915},{"id":975,"depth":232,"text":975},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},"\u002Fimg\u002Ftools\u002Fhelicone.webp","Helicone 真实评测：YC W23 项目，开源 LLM 观测平台 + Rust 写的 AI Gateway。2026-03-03 被 Mintlify 收购后转维护模式（安全更新 + 新模型 + bug fix 继续，主动新功能停）。免费 10K req\u002F月 + Pro $79 + Team $799（SOC2 + HIPAA）+ Enterprise 定制。零代码 SDK 改造、改 baseURL 即用，是接入最快的 LLM 观测之一。",[1477,1480,1483,1486],{"q":1478,"a":1479},"Helicone 被收购后还能用吗？","2026-03-03 Mintlify 收购 Helicone，产品转维护模式：安全 patch + 新模型支持 + bug fix 继续发，但主动新功能开发结束。现存生产部署仍稳定，但选型时要权衡：路线图不动 \u002F 不期待新观测形态 \u002F 接受工具被 Mintlify 整合或归档的风险。新项目长期演进建议看 Langfuse 或 Portkey。",{"q":1481,"a":1482},"Proxy 和 async 模式哪个好？","Proxy（改 baseURL，所有请求走 Helicone）= 接入快 + 
完整捕获，但加 ~5–20ms 延迟、Helicone 挂了请求也挂。Async（SDK 异步上报）= 0 延迟 + Helicone 故障不影响业务，但失败窗口可能漏 log。生产敏感链路用 async，开发 \u002F 内部用 proxy。",{"q":1484,"a":1485},"Proxy 能看到 agent 内部工具调用吗？","不能——proxy 只能看到穿过它的 LLM 请求，agent 框架内的 tool execution \u002F sub-agent \u002F retries 都不可见。复杂 agent 调试需要 trace 级深度，要 Langfuse 的 nested span 或 Helicone Trace API（手动 POST）。",{"q":1487,"a":1488},"和 Langfuse \u002F Portkey 怎么选？","Helicone = proxy-based，URL 一改分钟上手，请求级日志 + 基础 gateway 路由。Langfuse = SDK-based，代码改造小时级，但 nested span 深度 tracing + LLM-as-judge eval 一等。Portkey = gateway-first，250+ 模型 + MCP + 强合规但定价复杂。简单 + 快 → Helicone；agent 调试 → Langfuse；网关 + 治理 + 合规 → Portkey。",[728],{},[1492,773,708,1493],"saas","sdk",[1495,1498,1502,1506],{"plan":887,"price":743,"features":1496,"notes":1497},"10K req\u002F月 + 7 天 retention + 1 seat + 1GB storage + 基础 dashboards","Free trial \u002F hobby \u002F 验证",{"plan":893,"price":1499,"features":1500,"notes":1501},"$79\u002F月","10K + usage + 1 月 retention + unlimited seats + alerts + HQL + prompt management","中小生产",{"plan":899,"price":1503,"features":1504,"notes":1505},"$799\u002F月","10K + usage + 3 月 retention + SOC-2 + HIPAA + 5 orgs","中大型 + 合规",{"plan":905,"price":1507,"features":1508,"notes":1509},"Custom","自定义 retention + 永久存储 + SSO + on-prem + 专属支持","大型 \u002F 政企","Hobby 免费 10K req\u002F月 \u002F Pro $79\u002F月 \u002F Team $799\u002F月 \u002F Enterprise 定制",[1512],{"name":1513,"url":1514},"RAG Pipeline 搭建","\u002Fplaybook\u002Fonboarding\u002Frag-pipeline-build",{"power":279,"ux":289,"price":279,"cn_support":232,"stability":268},{"title":782,"description":1475},"coding\u002Fapi\u002Fhelicone",[1519,1521,1523,1525,1527],{"name":1520,"url":1429,"accessed":757},"Inference.net — Helicone Pricing & Alternatives (Jun 2026)",{"name":1522,"url":1436,"accessed":757},"Helicone 官网",{"name":1524,"url":1443,"accessed":757},"QASkills — Helicone LLM Monitoring Guide 2026",{"name":1526,"url":1450,"accessed":757},"AiPedia — Helicone 评测 + 
失败模式",{"name":1528,"url":1457,"accessed":757},"BuildMVPFast — Langfuse vs Helicone vs Portkey","tools\u002Fcoding\u002Fapi\u002Fhelicone","一行代码 LLM 观测——开源 Proxy + AI Gateway，2026-03 被 Mintlify 收购、维护模式运行",[1532,1533,1534,768,1535,1536,1537],"llm-observability","proxy","ai-gateway","ycombinator","soc2","hipaa","最容易接入的 LLM 观测，改 baseURL 几分钟看到 cost\u002Flatency\u002Ferrors。被 Mintlify 收购转维护模式后路线图不确定——做新项目权衡：要快上手 + 不期待新功能 OK；要 nested span + 持续演进走 Langfuse。","https:\u002F\u002Fwww.helicone.ai","GpJw1egdrEqix3JjRYdBYL5A5B8QlfscDzrOy_gnWYE",{"id":1542,"title":383,"alternatives":1543,"api_compatible":25,"body":1548,"category":708,"chinese_friendly":268,"cover":2227,"description":2228,"domestic":711,"extension":712,"faq":2229,"free":711,"github":25,"languages":2242,"meta":2243,"models":25,"navigation":312,"notSuitable":25,"opensource":312,"path":15,"pillar":731,"platforms":2244,"priceTable":2246,"pricing":2254,"published":746,"relatedPlaybooks":2255,"relatedReviews":25,"score":2257,"self_host":312,"seo":2258,"slug":2259,"sources":2260,"stem":2269,"suitable":25,"tagline":2270,"tags":2271,"updated":757,"verdict":2275,"website":2276,"__hash__":2277},"tools\u002Ftools\u002Fcoding\u002Fapi\u002Flitellm.md",[1544,1545,1546,1547],{"name":17,"url":18},{"name":788,"url":730},{"name":20,"url":21},{"name":23,"url":24},{"type":27,"value":1549,"toc":2215},[1550,1552,1559,1562,1564,1660,1662,1678,1683,1687,1691,1714,1718,1743,1747,1915,1917,2067,2069,2133,2135,2160,2162,2180,2182,2212],[30,1551,33],{"id":32},[35,1553,1554,1555,1558],{},"LiteLLM 是开源 LLM 网关里事实标准：MIT 协议，BerriAI 维护，双形态——SDK（",[39,1556,1557],{},"pip install","，单进程嵌入）+ Proxy（Docker Compose + Postgres，团队级网关）。100+ 厂商统一 OpenAI 接口，虚拟 Key + 团队预算 + 三类 fallback（错误\u002F政策\u002F上下文）+ 成本追踪 + 内置 admin UI。2026-03 供应链事件后 v1.83+ 强化镜像验证，生产固定签名版本。",[35,1560,1561],{},"适合：中大型团队 \u002F 合规 \u002F 想完全控数据 + BYOK；微服务架构需要语言无关的 OpenAI 网关；要把成本治理 + 观测做到自建。不适合：不想运维（SaaS 走 OpenRouter \u002F Portkey）；中文支付 \u002F 业务运营（走 one-api \u002F new-api）；纯个人项目（pip 装 SDK 
已够，不需要 Proxy）。",[30,1563,48],{"id":48},[50,1565,1566,1572,1581,1591,1600,1609,1615,1621,1630,1636,1642,1648,1654],{},[53,1567,1568,1571],{},[56,1569,1570],{},"100+ providers","：OpenAI \u002F Anthropic \u002F Google \u002F AWS Bedrock \u002F Azure \u002F vLLM \u002F Ollama \u002F Together \u002F HuggingFace 等",[53,1573,1574,1577,1578],{},[56,1575,1576],{},"统一 OpenAI 接口","：所有模型走 ",[39,1579,1580],{},"\u002Fv1\u002Fchat\u002Fcompletions",[53,1582,1583,1586,1587,1590],{},[56,1584,1585],{},"SDK 模式","：",[39,1588,1589],{},"from litellm import completion","，适合嵌入",[53,1592,1593,1595,1596,1599],{},[56,1594,807],{},"：HTTP 服务 + Postgres + admin UI（",[39,1597,1598],{},"\u002Fui","）",[53,1601,1602,1586,1605,1608],{},[56,1603,1604],{},"虚拟 Key",[39,1606,1607],{},"\u002Fkey\u002Fgenerate"," 给团队 \u002F 服务签发独立 Key + 预算 + 模型白名单",[53,1610,1611,1614],{},[56,1612,1613],{},"三类 fallback","：错误 \u002F 内容政策 \u002F context window",[53,1616,1617,1620],{},[56,1618,1619],{},"重试 + 超时 + cooldown","：完整 SRE 配套",[53,1622,1623,1586,1626,1629],{},[56,1624,1625],{},"Cost tracking",[39,1627,1628],{},"\u002Fglobal\u002Fspend\u002Freport"," + admin UI 看每团队 \u002F Key \u002F 模型成本",[53,1631,1632,1635],{},[56,1633,1634],{},"回调","：Langfuse \u002F Prometheus \u002F Slack 一键挂载",[53,1637,1638,1641],{},[56,1639,1640],{},"Guardrails","：Presidio PII masking \u002F 自定义内容检查",[53,1643,1644,1647],{},[56,1645,1646],{},"缓存","：Redis 内置 + 语义缓存",[53,1649,1650,1653],{},[56,1651,1652],{},"Routing strategy","：cost-based \u002F latency-based \u002F round-robin",[53,1655,1656,1659],{},[56,1657,1658],{},"MIT 协议","：完全自由商用 + 修改",[30,1661,122],{"id":122},[50,1663,1664,1670,1675],{},[53,1665,1666,1669],{},[56,1667,1668],{},"OSS","：$0；自托管成本 = 1 台 Postgres + 1 台 LiteLLM container（~2GB RAM）",[53,1671,1672,1674],{},[56,1673,905],{},"：Custom；SSO \u002F SAML \u002F 审计 \u002F SLA \u002F on-prem 部署支持",[53,1676,1677],{},"模型成本走各厂商直接结算（BYOK）",[138,1679,1680],{},[35,1681,1682],{},"小规模总成本：1 台 2 核 4G VPS 跑 Postgres + LiteLLM 月 $20–30，团队 10 
人完全够。",[30,1684,1686],{"id":1685},"实测10-人-saas-微服务架构","实测（10 人 SaaS \u002F 微服务架构）",[35,1688,1689],{},[56,1690,151],{},[50,1692,1693,1696,1699,1702,1705,1708,1711],{},[53,1694,1695],{},"Docker Compose 40 分钟拉起完整生产栈",[53,1697,1698],{},"虚拟 Key + 预算让微服务团队成本归因清晰",[53,1700,1701],{},"三类 fallback 配齐后可用率从 99.2% → 99.8%",[53,1703,1704],{},"admin UI 看每团队每天成本省了一堆自研 dashboard",[53,1706,1707],{},"Postgres + master key 模式，密钥 + 配置一致性高",[53,1709,1710],{},"与 Langfuse 集成做 trace + cost 双视角",[53,1712,1713],{},"多语言客户端（Python \u002F Node \u002F Go \u002F Rust）走同一 endpoint 体验一致",[35,1715,1716],{},[56,1717,181],{},[50,1719,1720,1727,1730,1733,1740],{},[53,1721,1722,1723,1726],{},"2026-03 供应链事件让团队对 ",[39,1724,1725],{},":latest"," tag 警惕，生产必须固定签名版本（如 v1.85.0）",[53,1728,1729],{},"Postgres salt key 一旦生成不能轮换，初始化前要谨慎备份",[53,1731,1732],{},"admin UI 早期版本英文为主，中文文档少",[53,1734,1735,1736,1739],{},"模型 ID 命名复杂（",[39,1737,1738],{},"provider\u002Fmodel-name","），各厂商命名规则不一",[53,1741,1742],{},"自托管 = 自付运维（Postgres backup \u002F 升级 \u002F 监控）",[30,1744,1746],{"id":1745},"上手proxy-模式","上手（Proxy 模式）",[213,1748,1750],{"className":215,"code":1749,"language":217,"meta":218,"style":218},"mkdir llm-gateway && cd llm-gateway\nopenssl rand -hex 32 > .master_key\nopenssl rand -hex 32 > .salt_key\n\n# docker-compose.yml 拉 ghcr.io\u002Fberriai\u002Flitellm:v1.85.0\n# config.yaml 写 model_list \u002F fallbacks \u002F litellm_settings\n\ndocker compose up -d\n\n# 生成虚拟 Key\ncurl -X POST http:\u002F\u002Flocalhost:4000\u002Fkey\u002Fgenerate \\\n  -H \"Authorization: Bearer $LITELLM_MASTER_KEY\" \\\n  -d '{\"models\":[\"gpt-5.4\",\"claude-sonnet-4.6\"],\"max_budget\":100}'\n\n# 业务方调用\ncurl http:\u002F\u002Flocalhost:4000\u002Fv1\u002Fchat\u002Fcompletions \\\n  -H \"Authorization: Bearer sk-xxx\" \\\n  -d 
'{\"model\":\"gpt-5.4\",\"messages\":[...]}'\n",[39,1751,1752,1767,1787,1802,1806,1811,1816,1820,1830,1834,1839,1855,1870,1878,1882,1887,1897,1907],{"__ignoreMap":218},[222,1753,1754,1757,1760,1762,1764],{"class":224,"line":225},[222,1755,1756],{"class":235},"mkdir",[222,1758,1759],{"class":239}," llm-gateway",[222,1761,1134],{"class":295},[222,1763,1128],{"class":243},[222,1765,1766],{"class":239}," llm-gateway\n",[222,1768,1769,1772,1775,1778,1781,1784],{"class":224,"line":232},[222,1770,1771],{"class":235},"openssl",[222,1773,1774],{"class":239}," rand",[222,1776,1777],{"class":243}," -hex",[222,1779,1780],{"class":243}," 32",[222,1782,1783],{"class":992}," >",[222,1785,1786],{"class":239}," .master_key\n",[222,1788,1789,1791,1793,1795,1797,1799],{"class":224,"line":268},[222,1790,1771],{"class":235},[222,1792,1774],{"class":239},[222,1794,1777],{"class":243},[222,1796,1780],{"class":243},[222,1798,1783],{"class":992},[222,1800,1801],{"class":239}," .salt_key\n",[222,1803,1804],{"class":224,"line":279},[222,1805,313],{"emptyLinePlaceholder":312},[222,1807,1808],{"class":224,"line":289},[222,1809,1810],{"class":228},"# docker-compose.yml 拉 ghcr.io\u002Fberriai\u002Flitellm:v1.85.0\n",[222,1812,1813],{"class":224,"line":304},[222,1814,1815],{"class":228},"# config.yaml 写 model_list \u002F fallbacks \u002F litellm_settings\n",[222,1817,1818],{"class":224,"line":5},[222,1819,313],{"emptyLinePlaceholder":312},[222,1821,1822,1824,1826,1828],{"class":224,"line":8},[222,1823,236],{"class":235},[222,1825,1139],{"class":239},[222,1827,1142],{"class":239},[222,1829,1145],{"class":243},[222,1831,1832],{"class":224,"line":321},[222,1833,313],{"emptyLinePlaceholder":312},[222,1835,1836],{"class":224,"line":7},[222,1837,1838],{"class":228},"# 生成虚拟 Key\n",[222,1840,1841,1844,1847,1850,1853],{"class":224,"line":332},[222,1842,1843],{"class":235},"curl",[222,1845,1846],{"class":243}," -X",[222,1848,1849],{"class":239}," POST",[222,1851,1852],{"class":239}," 
http:\u002F\u002Flocalhost:4000\u002Fkey\u002Fgenerate",[222,1854,265],{"class":243},[222,1856,1857,1860,1863,1866,1868],{"class":224,"line":338},[222,1858,1859],{"class":243},"  -H",[222,1861,1862],{"class":239}," \"Authorization: Bearer ",[222,1864,1865],{"class":295},"$LITELLM_MASTER_KEY",[222,1867,1063],{"class":239},[222,1869,265],{"class":243},[222,1871,1872,1875],{"class":224,"line":344},[222,1873,1874],{"class":243},"  -d",[222,1876,1877],{"class":239}," '{\"models\":[\"gpt-5.4\",\"claude-sonnet-4.6\"],\"max_budget\":100}'\n",[222,1879,1880],{"class":224,"line":350},[222,1881,313],{"emptyLinePlaceholder":312},[222,1883,1884],{"class":224,"line":356},[222,1885,1886],{"class":228},"# 业务方调用\n",[222,1888,1890,1892,1895],{"class":224,"line":1889},16,[222,1891,1843],{"class":235},[222,1893,1894],{"class":239}," http:\u002F\u002Flocalhost:4000\u002Fv1\u002Fchat\u002Fcompletions",[222,1896,265],{"class":243},[222,1898,1900,1902,1905],{"class":224,"line":1899},17,[222,1901,1859],{"class":243},[222,1903,1904],{"class":239}," \"Authorization: Bearer sk-xxx\"",[222,1906,265],{"class":243},[222,1908,1910,1912],{"class":224,"line":1909},18,[222,1911,1874],{"class":243},[222,1913,1914],{"class":239}," '{\"model\":\"gpt-5.4\",\"messages\":[...]}'\n",[30,1916,362],{"id":362},[364,1918,1919,1933],{},[367,1920,1921],{},[370,1922,1923,1925,1927,1929,1931],{},[373,1924,375],{},[373,1926,383],{},[373,1928,386],{},[373,1930,11],{},[373,1932,1163],{},[388,1934,1935,1950,1964,1977,1994,2007,2021,2037,2051],{},[370,1936,1937,1940,1943,1946,1948],{},[393,1938,1939],{},"形态",[393,1941,1942],{},"OSS + 
Enterprise",[393,1944,1945],{},"SaaS",[393,1947,1668],{},[393,1949,1945],{},[370,1951,1952,1955,1958,1960,1962],{},[393,1953,1954],{},"协议",[393,1956,1957],{},"MIT",[393,1959,406],{},[393,1961,1957],{},[393,1963,406],{},[370,1965,1966,1969,1971,1973,1975],{},[393,1967,1968],{},"自托管",[393,1970,417],{},[393,1972,414],{},[393,1974,417],{},[393,1976,905],{},[370,1978,1979,1982,1985,1988,1991],{},[393,1980,1981],{},"模型数",[393,1983,1984],{},"100+",[393,1986,1987],{},"300+",[393,1989,1990],{},"30+",[393,1992,1993],{},"250+",[370,1995,1996,1999,2001,2003,2005],{},[393,1997,1998],{},"虚拟 Key + 预算",[393,2000,417],{},[393,2002,406],{},[393,2004,417],{},[393,2006,417],{},[370,2008,2009,2012,2015,2017,2019],{},[393,2010,2011],{},"Fallback",[393,2013,2014],{},"✅ 三类",[393,2016,417],{},[393,2018,417],{},[393,2020,417],{},[370,2022,2023,2026,2029,2032,2035],{},[393,2024,2025],{},"admin UI",[393,2027,2028],{},"✅ 内置",[393,2030,2031],{},"dashboard",[393,2033,2034],{},"✅ 中文 UI",[393,2036,417],{},[370,2038,2039,2042,2044,2046,2049],{},[393,2040,2041],{},"中文支付",[393,2043,414],{},[393,2045,414],{},[393,2047,2048],{},"✅ EPay 内置",[393,2050,414],{},[370,2052,2053,2056,2059,2061,2064],{},[393,2054,2055],{},"集成观测",[393,2057,2058],{},"Langfuse\u002FProm",[393,2060,2031],{},[393,2062,2063],{},"仪表盘",[393,2065,2066],{},"原生",[30,2068,542],{"id":542},[50,2070,2071,2079,2085,2091,2097,2107,2113,2127],{},[53,2072,2073,1586,2076,2078],{},[56,2074,2075],{},"必固定版本号",[39,2077,1725],{}," \u002F 滚动 tag 在 2026-03 供应链事件后已是禁忌；用带签名验证的具体版本（如 v1.85.0）",[53,2080,2081,2084],{},[56,2082,2083],{},"salt_key 不能轮换","：初始化前生成 + 加密备份",[53,2086,2087,2090],{},[56,2088,2089],{},"Postgres 备份","：所有虚拟 Key + 预算都在 DB，必须定期备份",[53,2092,2093,2096],{},[56,2094,2095],{},"fallback 链别堆超 3 个","：失败叠加延迟 + 计费混乱",[53,2098,2099,2102,2103,2106],{},[56,2100,2101],{},"drop_params 谨慎开","：开 ",[39,2104,2105],{},"drop_params: true"," 会静默丢不兼容字段，调试时容易 confused",[53,2108,2109,2112],{},[56,2110,2111],{},"PII guardrail 不是 0 延迟","：Presidio 调用增 
50–100ms，敏感场景再用",[53,2114,2115,2118,2119,2122,2123,2126],{},[56,2116,2117],{},"monorepo + workspace 模型映射","：业务方调 ",[39,2120,2121],{},"gpt-4"," → config 映射到 ",[39,2124,2125],{},"openai\u002Fgpt-5.4-mini","，要规划稳定映射表",[53,2128,2129,2132],{},[56,2130,2131],{},"国内自托管","：BYOK Key 走海外 API 仍然受网络影响，需要部署在能直连厂商的节点",[30,2134,601],{"id":600},[50,2136,2137,2140,2143,2146,2149,2152,2154,2157],{},[53,2138,2139],{},"✅ 中大型团队 \u002F 微服务架构",[53,2141,2142],{},"✅ 合规 \u002F 数据主权要求",[53,2144,2145],{},"✅ 多团队预算治理",[53,2147,2148],{},"✅ 想叠加 Langfuse \u002F Helicone \u002F Prometheus 观测",[53,2150,2151],{},"✅ BYOK 模式跨多厂商",[53,2153,624],{},[53,2155,2156],{},"❌ 国内业务支付 + 中文运营（走 one-api \u002F new-api）",[53,2158,2159],{},"❌ 纯个人项目（SDK 足够，不需要 Proxy）",[30,2161,633],{"id":633},[50,2163,2164,2168,2172,2176],{},[53,2165,2166],{},[639,2167,646],{"href":18},[53,2169,2170],{},[639,2171,1419],{"href":730},[53,2173,2174],{},[639,2175,651],{"href":21},[53,2177,2178],{},[639,2179,656],{"href":24},[30,2181,659],{"id":659},[661,2183,2184,2191,2198,2205],{},[53,2185,2186,2187],{},"NerdLevelTech — LiteLLM Proxy Production Tutorial 2026（含 v1.85.0 + 供应链事件细节）",[639,2188,2189],{"href":2189,"rel":2190},"https:\u002F\u002Fnerdleveltech.com\u002Flitellm-proxy-production-llm-gateway-tutorial",[670],[53,2192,2193,2194],{},"LiteLLM 官方文档 — Fallbacks \u002F Retries \u002F Cooldowns ",[639,2195,2196],{"href":2196,"rel":2197},"https:\u002F\u002Fdocs.litellm.ai\u002Fdocs\u002Fproxy\u002Freliability",[670],[53,2199,2200,2201],{},"Youngju.dev — LiteLLM Complete Guide 2026（SDK vs Proxy \u002F cost-based routing）",[639,2202,2203],{"href":2203,"rel":2204},"https:\u002F\u002Fwww.youngju.dev\u002Fblog\u002Fculture\u002F2026-03-25-litellm-unified-llm-api-proxy-guide-2025.en",[670],[53,2206,2207,2208],{},"GitHub — BerriAI\u002Flitellm README ",[639,2209,2210],{"href":2210,"rel":2211},"https:\u002F\u002Fgithub.com\u002FBerriAI\u002Flitellm",[670],[693,2213,2214],{},"html pre.shiki code .sScJk, html code.shiki 
.sScJk{--shiki-default:#6F42C1;--shiki-dark:#B392F0}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .szBVR, html code.shiki .szBVR{--shiki-default:#D73A49;--shiki-dark:#F97583}html pre.shiki code .sJ8bj, html code.shiki .sJ8bj{--shiki-default:#6A737D;--shiki-dark:#6A737D}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":218,"searchDepth":268,"depth":268,"links":2216},[2217,2218,2219,2220,2221,2222,2223,2224,2225,2226],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":1685,"depth":232,"text":1686},{"id":1745,"depth":232,"text":1746},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},"\u002Fimg\u002Ftools\u002Flitellm.webp","LiteLLM 真实评测：MIT 开源 LLM 网关，BerriAI 维护。SDK 模式（pip install litellm）+ Proxy 
模式（Docker Compose 自托管）双形态，100+ 厂商统一 OpenAI 接口，虚拟 Key + 团队预算 + 三类 fallback + 成本追踪 + 内置 UI。2026-03 经历供应链事件后 v1.83+ 强化签名 + 镜像验证，生产请固定版本号。",[2230,2233,2236,2239],{"q":2231,"a":2232},"SDK 和 Proxy 模式区别？","SDK 模式（`from litellm import completion`）直接在 Python 里调，适合个人项目 \u002F 单服务。Proxy 模式启动一个 HTTP 服务（默认 4000 端口）+ Postgres，所有应用通过 OpenAI 兼容 endpoint 调用，支持虚拟 Key \u002F 团队 \u002F 预算 \u002F 配额 \u002F admin UI——团队 \u002F 多语言客户端 \u002F 生产建议走 Proxy。",{"q":2234,"a":2235},"Fallback 有几种？","三类：(1) general fallback——5xx\u002F429 错误切到备用模型；(2) content policy fallback——内容审查拒绝时切；(3) context window fallback——输入超 context 切大窗口模型（比如超 GPT-4 32k 自动切 Claude 200k）。可叠加 num_retries \u002F cooldown \u002F timeout 做完整 SRE 策略。",{"q":2237,"a":2238},"2026-03 供应链事件是什么？","2026-03-24 PyPI 上的 v1.82.7 \u002F v1.82.8 在被替换约 40 分钟内可能植入 Trivy CI token 外泄代码。BerriAI 在 v1.83+ 强化签名 + 镜像验证，生产部署务必固定到带签名验证的版本（如 v1.85.0），不要用 `:latest` tag。",{"q":2240,"a":2241},"和 OpenRouter 怎么选？","OpenRouter = SaaS（不用自己运维 + 直接付钱）；LiteLLM = OSS 自托管（自付服务器 + 完全控制数据 + BYOK 所有 Key）。中大型团队 \u002F 合规 \u002F 长期成本敏感 \u002F 自建 → LiteLLM Proxy；小团队 \u002F 不想运维 \u002F 快速迭代 → OpenRouter。",[728],{},[1493,1533,236,2245],"kubernetes",[2247,2251],{"plan":2248,"price":738,"features":2249,"notes":2250},"Open Source","SDK + Proxy + Postgres 虚拟 Key + 预算 + fallback + admin UI + 100+ providers","完全自托管，模型 \u002F 平台费走自付",{"plan":905,"price":1507,"features":2252,"notes":2253},"SSO \u002F SAML + Audit + JWT auth + 高级路由 + SLA + on-prem 部署支持","联系 BerriAI 销售","MIT 开源免费 \u002F Enterprise SaaS 定制",[2256],{"name":1513,"url":1514},{"power":289,"ux":279,"price":289,"cn_support":268,"stability":279},{"title":383,"description":2228},"coding\u002Fapi\u002Flitellm",[2261,2263,2265,2267],{"name":2262,"url":2189,"accessed":757},"NerdLevelTech — LiteLLM Proxy 生产教程 2026",{"name":2264,"url":2196,"accessed":757},"LiteLLM 官方文档 — Fallbacks",{"name":2266,"url":2203,"accessed":757},"Youngju.dev — LiteLLM Complete Guide 2026",{"name":2268,"url":2210,"accessed":757},"GitHub — 
BerriAI\u002Flitellm","tools\u002Fcoding\u002Fapi\u002Flitellm","MIT 开源 LLM 网关——SDK + Proxy 双形态，100+ 厂商统一 OpenAI 接口 + 虚拟 Key + 团队预算",[767,1533,1493,768,769,2272,2273,2274],"fallback","virtual-keys","byok","想要『SaaS 体验 + 完全自托管』的开源 LLM 网关首选。组合『LiteLLM 网关 + Helicone\u002FLangfuse 观测』在中大型 dev org 是黄金组合。中文中转 + 业务支付走 one-api。","https:\u002F\u002Fwww.litellm.ai","6bZL9hkjSKgSreq6sFAHStozW6QAMnwdxy4__FnhQho",{"id":10,"title":11,"alternatives":2279,"api_compatible":25,"body":2284,"category":708,"chinese_friendly":289,"cover":709,"description":710,"domestic":711,"extension":712,"faq":2762,"free":711,"github":25,"languages":2767,"meta":2768,"models":25,"navigation":312,"notSuitable":25,"opensource":312,"path":730,"pillar":731,"platforms":2769,"priceTable":2770,"pricing":129,"published":746,"relatedPlaybooks":2773,"relatedReviews":25,"score":2775,"self_host":312,"seo":2776,"slug":753,"sources":2777,"stem":764,"suitable":25,"tagline":765,"tags":2782,"updated":757,"verdict":774,"website":683,"__hash__":775},[2280,2281,2282,2283],{"name":14,"url":15},{"name":17,"url":18},{"name":20,"url":21},{"name":23,"url":24},{"type":27,"value":2285,"toc":2750},[2286,2288,2292,2294,2296,2342,2344,2354,2358,2360,2364,2382,2386,2404,2406,2502,2504,2642,2644,2682,2684,2704,2706,2724,2726,2748],[30,2287,33],{"id":32},[35,2289,37,2290,42],{},[39,2291,41],{},[35,2293,45],{},[30,2295,48],{"id":48},[50,2297,2298,2302,2306,2310,2314,2318,2322,2326,2330,2334,2338],{},[53,2299,2300,59],{},[56,2301,58],{},[53,2303,2304,65],{},[56,2305,64],{},[53,2307,2308,71],{},[56,2309,70],{},[53,2311,2312,77],{},[56,2313,76],{},[53,2315,2316,83],{},[56,2317,82],{},[53,2319,2320,89],{},[56,2321,88],{},[53,2323,2324,95],{},[56,2325,94],{},[53,2327,2328,101],{},[56,2329,100],{},[53,2331,2332,107],{},[56,2333,106],{},[53,2335,2336,113],{},[56,2337,112],{},[53,2339,2340,119],{},[56,2341,118],{},[30,2343,122],{"id":122},[50,2345,2346,2350,2352],{},[53,2347,2348,130],{},[56,2349,129],{},[53,2351,133],{},[53,2353,136],{},[138,23
55,2356],{},[35,2357,142],{},[30,2359,146],{"id":145},[35,2361,2362],{},[56,2363,151],{},[50,2365,2366,2370,2372,2374,2376,2378,2380],{},[53,2367,2368,158],{},[39,2369,41],{},[53,2371,161],{},[53,2373,164],{},[53,2375,167],{},[53,2377,170],{},[53,2379,173],{},[53,2381,176],{},[35,2383,2384],{},[56,2385,181],{},[50,2387,2388,2390,2392,2394,2396,2398,2400,2402],{},[53,2389,186],{},[53,2391,189],{},[53,2393,192],{},[53,2395,195],{},[53,2397,198],{},[53,2399,201],{},[53,2401,204],{},[53,2403,207],{},[30,2405,211],{"id":210},[213,2407,2408],{"className":215,"code":216,"language":217,"meta":218,"style":218},[39,2409,2410,2414,2436,2444,2452,2462,2466,2470,2474,2478,2482,2486,2490,2494,2498],{"__ignoreMap":218},[222,2411,2412],{"class":224,"line":225},[222,2413,229],{"class":228},[222,2415,2416,2418,2420,2422,2424,2426,2428,2430,2432,2434],{"class":224,"line":232},[222,2417,236],{"class":235},[222,2419,240],{"class":239},[222,2421,244],{"class":243},[222,2423,247],{"class":239},[222,2425,250],{"class":243},[222,2427,253],{"class":243},[222,2429,256],{"class":239},[222,2431,259],{"class":243},[222,2433,262],{"class":239},[222,2435,265],{"class":243},[222,2437,2438,2440,2442],{"class":224,"line":268},[222,2439,271],{"class":243},[222,2441,274],{"class":239},[222,2443,265],{"class":243},[222,2445,2446,2448,2450],{"class":224,"line":279},[222,2447,271],{"class":243},[222,2449,284],{"class":239},[222,2451,265],{"class":243},[222,2453,2454,2456,2458,2460],{"class":224,"line":289},[222,2455,292],{"class":243},[222,2457,296],{"class":295},[222,2459,299],{"class":239},[222,2461,265],{"class":243},[222,2463,2464],{"class":224,"line":304},[222,2465,307],{"class":239},[222,2467,2468],{"class":224,"line":5},[222,2469,313],{"emptyLinePlaceholder":312},[222,2471,2472],{"class":224,"line":8},[222,2473,318],{"class":228},[222,2475,2476],{"class":224,"line":321},[222,2477,324],{"class":228},[222,2479,2480],{"class":224,"line":7},[222,2481,329],{"class":228},[222,2483,2484],{"class":224,"lin
e":332},[222,2485,335],{"class":228},[222,2487,2488],{"class":224,"line":338},[222,2489,341],{"class":228},[222,2491,2492],{"class":224,"line":344},[222,2493,347],{"class":228},[222,2495,2496],{"class":224,"line":350},[222,2497,353],{"class":228},[222,2499,2500],{"class":224,"line":356},[222,2501,359],{"class":228},[30,2503,362],{"id":362},[364,2505,2506,2520],{},[367,2507,2508],{},[370,2509,2510,2512,2514,2516,2518],{},[373,2511,375],{},[373,2513,11],{},[373,2515,380],{},[373,2517,383],{},[373,2519,386],{},[388,2521,2522,2534,2546,2558,2570,2582,2594,2606,2618,2630],{},[370,2523,2524,2526,2528,2530,2532],{},[393,2525,395],{},[393,2527,398],{},[393,2529,398],{},[393,2531,403],{},[393,2533,406],{},[370,2535,2536,2538,2540,2542,2544],{},[393,2537,411],{},[393,2539,414],{},[393,2541,417],{},[393,2543,420],{},[393,2545,414],{},[370,2547,2548,2550,2552,2554,2556],{},[393,2549,427],{},[393,2551,414],{},[393,2553,417],{},[393,2555,406],{},[393,2557,406],{},[370,2559,2560,2562,2564,2566,2568],{},[393,2561,440],{},[393,2563,414],{},[393,2565,445],{},[393,2567,414],{},[393,2569,450],{},[370,2571,2572,2574,2576,2578,2580],{},[393,2573,455],{},[393,2575,458],{},[393,2577,458],{},[393,2579,406],{},[393,2581,406],{},[370,2583,2584,2586,2588,2590,2592],{},[393,2585,469],{},[393,2587,417],{},[393,2589,417],{},[393,2591,476],{},[393,2593,476],{},[370,2595,2596,2598,2600,2602,2604],{},[393,2597,483],{},[393,2599,486],{},[393,2601,486],{},[393,2603,491],{},[393,2605,494],{},[370,2607,2608,2610,2612,2614,2616],{},[393,2609,499],{},[393,2611,414],{},[393,2613,417],{},[393,2615,417],{},[393,2617,508],{},[370,2619,2620,2622,2624,2626,2628],{},[393,2621,513],{},[393,2623,516],{},[393,2625,519],{},[393,2627,522],{},[393,2629,406],{},[370,2631,2632,2634,2636,2638,2640],{},[393,2633,529],{},[393,2635,532],{},[393,2637,532],{},[393,2639,537],{},[393,2641,406],{},[30,2643,542],{"id":542},[50,2645,2646,2650,2654,2658,2662,2666,2670,2674,2678],{},[53,2647,2648],{},[56,2649,549],{},[53,2651,2652,5
55],{},[56,2653,554],{},[53,2655,2656,561],{},[56,2657,560],{},[53,2659,2660,567],{},[56,2661,566],{},[53,2663,2664,573],{},[56,2665,572],{},[53,2667,2668,579],{},[56,2669,578],{},[53,2671,2672,585],{},[56,2673,584],{},[53,2675,2676,591],{},[56,2677,590],{},[53,2679,2680,597],{},[56,2681,596],{},[30,2683,601],{"id":600},[50,2685,2686,2688,2690,2692,2694,2696,2698,2700,2702],{},[53,2687,606],{},[53,2689,609],{},[53,2691,612],{},[53,2693,615],{},[53,2695,618],{},[53,2697,621],{},[53,2699,624],{},[53,2701,627],{},[53,2703,630],{},[30,2705,633],{"id":633},[50,2707,2708,2712,2716,2720],{},[53,2709,2710],{},[639,2711,641],{"href":15},[53,2713,2714],{},[639,2715,646],{"href":18},[53,2717,2718],{},[639,2719,651],{"href":21},[53,2721,2722],{},[639,2723,656],{"href":24},[30,2725,659],{"id":659},[661,2727,2728,2733,2738,2743],{},[53,2729,665,2730],{},[639,2731,668],{"href":668,"rel":2732},[670],[53,2734,673,2735],{},[639,2736,676],{"href":676,"rel":2737},[670],[53,2739,680,2740],{},[639,2741,683],{"href":683,"rel":2742},[670],[53,2744,687,2745],{},[639,2746,690],{"href":690,"rel":2747},[670],[693,2749,695],{},{"title":218,"searchDepth":268,"depth":268,"links":2751},[2752,2753,2754,2755,2756,2757,2758,2759,2760,2761],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":145,"depth":232,"text":146},{"id":210,"depth":232,"text":211},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},[2763,2764,2765,2766],{"q":715,"a":716},{"q":718,"a":719},{"q":721,"a":722},{"q":724,"a":725},[727,728],{},[236,733,734],[2771,2772],{"plan":737,"price":738,"features":739,"notes":740},{"plan":742,"price":743,"features":744,"notes":745},[2774],{"name":749,"url":750},{"power":279,"ux":279,"price":289,"cn_support":289,"stability":279},{"title":11,"description":710},[2778,2779,2780,2781],{"name":756,"url":668,"accessed":757},{"name":759,"
url":676,"accessed":757},{"name":761,"url":683,"accessed":757},{"name":763,"url":690,"accessed":757},[767,768,769,770,771,772,773],{"id":2784,"title":386,"alternatives":2785,"api_compatible":25,"body":2790,"category":708,"chinese_friendly":232,"cover":3248,"description":3249,"domestic":711,"extension":712,"faq":3250,"free":711,"github":25,"languages":3263,"meta":3264,"models":25,"navigation":312,"notSuitable":25,"opensource":711,"path":18,"pillar":731,"platforms":3265,"priceTable":3266,"pricing":3281,"published":746,"relatedPlaybooks":3282,"relatedReviews":25,"score":3285,"self_host":711,"seo":3286,"slug":3287,"sources":3288,"stem":3297,"suitable":25,"tagline":3298,"tags":3299,"updated":757,"verdict":3303,"website":3304,"__hash__":3305},"tools\u002Ftools\u002Fcoding\u002Fapi\u002Fopenrouter.md",[2786,2787,2788,2789],{"name":14,"url":15},{"name":788,"url":730},{"name":20,"url":21},{"name":23,"url":24},{"type":27,"value":2791,"toc":3236},[2792,2794,2797,2800,2802,2876,2878,2907,2912,2916,2920,2937,2942,2966,2968,3000,3002,3113,3115,3153,3155,3184,3186,3204,3206],[30,2793,33],{"id":32},[35,2795,2796],{},"OpenRouter 是 AI API 聚合先驱——一个 OpenAI 兼容 endpoint + 一个 Key，调 60+ 厂商 300+ 模型，5M+ 用户。模型 passthrough 定价 0 markup，但充值有 5.5% 信用卡平台费（$0.80 最低）+ BYOK 月 100 万请求后 5%。自动 fallback \u002F playground \u002F 海量模型选型是杀手锏。国内直连延迟 1500–3000ms + 不支持支付宝是硬伤。",[35,2798,2799],{},"适合：海外开发者；多模型选型 \u002F 横评；生产 fallback 高可用；零迁移成本（OpenAI SDK 改 baseURL）。不适合：国内对延迟敏感的 AI 编程工具（用 OfoxAI \u002F 自建中转）；要支付宝 \u002F 微信 \u002F 银联；要 self-host（用 one-api \u002F LiteLLM）。",[30,2801,48],{"id":48},[50,2803,2804,2810,2819,2830,2840,2846,2852,2858,2864,2870],{},[53,2805,2806,2809],{},[56,2807,2808],{},"60+ 厂商 300+ 模型","：OpenAI \u002F Anthropic \u002F Google \u002F Meta \u002F DeepSeek \u002F MiniMax \u002F Mistral \u002F Cohere \u002F xAI \u002F NVIDIA \u002F Qwen \u002F 字节豆包 等",[53,2811,2812,1586,2815,2818],{},[56,2813,2814],{},"OpenAI 兼容 
endpoint",[39,2816,2817],{},"https:\u002F\u002Fopenrouter.ai\u002Fapi\u002Fv1","，SDK 改 baseURL 即用",[53,2820,2821,1586,2824,2826,2827,1599],{},[56,2822,2823],{},"模型 ID 格式",[39,2825,1738],{},"（如 ",[39,2828,2829],{},"anthropic\u002Fclaude-sonnet-4.6",[53,2831,2832,2835,2836,2839],{},[56,2833,2834],{},"自动 fallback","：请求里列 ",[39,2837,2838],{},"models: [...]","，前者失败自动切后者",[53,2841,2842,2845],{},[56,2843,2844],{},"Playground","：5 模型并排测同 prompt + 成本 + 延迟 + 输出",[53,2847,2848,2851],{},[56,2849,2850],{},"BYOK","：自带 OpenAI \u002F Anthropic Key，OpenRouter 只做网关；前 100 万 req\u002F月免费，超 5% fee",[53,2853,2854,2857],{},[56,2855,2856],{},"Passthrough 定价","：模型按厂商官方价",[53,2859,2860,2863],{},[56,2861,2862],{},"免费模型","：Llama 4 Scout \u002F DeepSeek V4 Flash \u002F Qwen3 Coder \u002F Gemma 3 等，每日 5\u002F200 次",[53,2865,2866,2869],{},[56,2867,2868],{},"Provider ranking \u002F SLA","：dashboard 看每家 provider 延迟 + 错误率",[53,2871,2872,2875],{},[56,2873,2874],{},"Rankings 页","：模型按 token 消耗排名（市场热度参考）",[30,2877,122],{"id":122},[50,2879,2880,2886,2892,2897,2902],{},[53,2881,2882,2885],{},[56,2883,2884],{},"Free","：$1 credit + 免费模型 5\u002F日 + 标准限流",[53,2887,2888,2891],{},[56,2889,2890],{},"Pay-as-you-go","：模型 passthrough + 5.5% 卡费（最低 $0.80）+ 充值 $5 后免费模型涨到 200\u002F日",[53,2893,2894,2896],{},[56,2895,899],{},"：$99\u002F月 + Priority routing + 99.9% SLA",[53,2898,2899,2901],{},[56,2900,905],{},"：Custom 专属基础设施",[53,2903,2904,2906],{},[56,2905,2850],{},"：前 100 万 req\u002F月免费，超出 5%",[138,2908,2909],{},[35,2910,2911],{},"实际总成本 ≈ 模型价 × (1 + 5.5%) + BYOK 5% × 月 >1M 部分。预算按 5–7% overhead 算。",[30,2913,2915],{"id":2914},"实测小型-saas-后端-海外节点","实测（小型 SaaS 后端 \u002F 海外节点）",[35,2917,2918],{},[56,2919,151],{},[50,2921,2922,2925,2928,2931,2934],{},[53,2923,2924],{},"5 分钟接入，OpenAI SDK 改两行配置",[53,2926,2927],{},"Playground 横评新模型省一大堆 boilerplate",[53,2929,2930],{},"自动 fallback 救命：Anthropic 4 小时宕机时应用零中断",[53,2932,2933],{},"模型 ID 提示器 + Rankings 看市场热度方便选型",[53,2935,2936],{},"海外节点延迟 300–600ms，CDN 
体感好",[35,2938,2939],{},[56,2940,2941],{},"踩坑（国内）：",[50,2943,2944,2947,2950,2953,2960,2963],{},[53,2945,2946],{},"国内直连 1500–3000ms + 高峰超时率明显，Cursor \u002F Claude Code 高频调用体感糟",[53,2948,2949],{},"不支持支付宝 \u002F 微信 \u002F 银联，只 Visa\u002FMastercard \u002F USDC",[53,2951,2952],{},"信用卡费 5.5% 最低 $0.80，\u003C$15 充值实际打到 10%+",[53,2954,2955,2956,2959],{},"模型 ID 点号分隔（",[39,2957,2958],{},"claude-sonnet-4.6","）易跟连字符混",[53,2961,2962],{},"Claude Code 默认走 Anthropic 原生协议，OpenRouter 适配偶有不一致",[53,2964,2965],{},"「免费模型」rate limit 后可能静默切付费",[30,2967,975],{"id":975},[661,2969,2970,2973,2976,2979,2985,2991,2997],{},[53,2971,2972],{},"openrouter.ai → Google \u002F GitHub OAuth 注册",[53,2974,2975],{},"Keys → 创建 API Key（sk-or-xxx）",[53,2977,2978],{},"充值 $10+（Visa \u002F Mastercard \u002F USDC）→ 解锁更高免费配额",[53,2980,2981,2982],{},"代码：",[39,2983,2984],{},"OpenAI(baseURL='https:\u002F\u002Fopenrouter.ai\u002Fapi\u002Fv1', api_key=KEY)",[53,2986,2987,2988,2990],{},"模型用 ",[39,2989,1738],{}," 格式",[53,2992,2993,2994],{},"加 fallback：",[39,2995,2996],{},"extra_body={\"models\": [\"anthropic\u002Fclaude-sonnet-4.6\", \"openai\u002Fgpt-5.4\"]}",[53,2998,2999],{},"Playground 横评再批量切",[30,3001,362],{"id":362},[364,3003,3004,3018],{},[367,3005,3006],{},[370,3007,3008,3010,3012,3014,3016],{},[373,3009,375],{},[373,3011,386],{},[373,3013,383],{},[373,3015,11],{},[373,3017,1163],{},[388,3019,3020,3033,3045,3057,3069,3081,3097],{},[370,3021,3022,3024,3026,3029,3031],{},[393,3023,1939],{},[393,3025,1945],{},[393,3027,3028],{},"OSS + 
SaaS",[393,3030,1668],{},[393,3032,1945],{},[370,3034,3035,3037,3039,3041,3043],{},[393,3036,1981],{},[393,3038,1987],{},[393,3040,1984],{},[393,3042,1990],{},[393,3044,1993],{},[370,3046,3047,3049,3051,3053,3055],{},[393,3048,1968],{},[393,3050,414],{},[393,3052,417],{},[393,3054,417],{},[393,3056,905],{},[370,3058,3059,3061,3063,3065,3067],{},[393,3060,2041],{},[393,3062,414],{},[393,3064,406],{},[393,3066,417],{},[393,3068,406],{},[370,3070,3071,3073,3075,3077,3079],{},[393,3072,2011],{},[393,3074,417],{},[393,3076,417],{},[393,3078,417],{},[393,3080,417],{},[370,3082,3083,3086,3089,3092,3094],{},[393,3084,3085],{},"国内延迟",[393,3087,3088],{},"1500–3000ms",[393,3090,3091],{},"自托管自定",[393,3093,3091],{},[393,3095,3096],{},"海外为主",[370,3098,3099,3102,3105,3108,3110],{},[393,3100,3101],{},"成本",[393,3103,3104],{},"模型 + 5.5%\u002FBYOK 5%",[393,3106,3107],{},"自付服务器",[393,3109,3107],{},[393,3111,3112],{},"按 logs 计费",[30,3114,542],{"id":542},[50,3116,3117,3123,3129,3135,3141,3147],{},[53,3118,3119,3122],{},[56,3120,3121],{},"国内别裸用","：1500ms+ 起、超时率高，主链路上 OfoxAI \u002F 自建 one-api 中转，OpenRouter 当冷门模型补",[53,3124,3125,3128],{},[56,3126,3127],{},"预算多算 5–7%","：5.5% 信用卡 + BYOK 5% + 偶发汇率",[53,3130,3131,3134],{},[56,3132,3133],{},"免费模型生产慎用","：rate limit 后可能静默 fallback 付费，账单失控",[53,3136,3137,3140],{},[56,3138,3139],{},"模型 ID 格式坑","：点号 vs 连字符要测；新模型 ID 改名要监控",[53,3142,3143,3146],{},[56,3144,3145],{},"fallback 别堆太多","：5+ fallback 一次失败延迟叠加可能 10s+，前 2 个即可",[53,3148,3149,3152],{},[56,3150,3151],{},"Claude Code 原生模式建议直连","：OpenRouter 走 OpenAI 兼容协议有时与原生 Anthropic 协议有出入",[30,3154,601],{"id":600},[50,3156,3157,3160,3163,3166,3169,3172,3175,3178,3181],{},[53,3158,3159],{},"✅ 海外开发者 \u002F 跨境业务",[53,3161,3162],{},"✅ 多模型选型 \u002F 横评",[53,3164,3165],{},"✅ 生产 fallback 高可用",[53,3167,3168],{},"✅ 零迁移成本（OpenAI SDK 改 baseURL）",[53,3170,3171],{},"✅ BYOK 模式给团队统一 Key 管理",[53,3173,3174],{},"❌ 国内 AI 编程工具（Cursor \u002F Claude Code）高频调用",[53,3176,3177],{},"❌ 要支付宝 \u002F 微信 \u002F 银联",[53,3179,3180],{},"❌ 
Self-host \u002F 完全控制数据",[53,3182,3183],{},"❌ 极致低延迟实时应用",[30,3185,633],{"id":633},[50,3187,3188,3192,3196,3200],{},[53,3189,3190],{},[639,3191,641],{"href":15},[53,3193,3194],{},[639,3195,1419],{"href":730},[53,3197,3198],{},[639,3199,651],{"href":21},[53,3201,3202],{},[639,3203,656],{"href":24},[30,3205,659],{"id":659},[661,3207,3208,3215,3222,3229],{},[53,3209,3210,3211],{},"OfoxAI — OpenRouter 完全指南 2026（国内延迟实测 + 替代方案）",[639,3212,3213],{"href":3213,"rel":3214},"https:\u002F\u002Fofox.ai\u002Fzh\u002Fblog\u002Fopenrouter-complete-guide-china-developers-2026",[670],[53,3216,3217,3218],{},"OfoxAI — OpenRouter Pricing 2026 Hidden Markup Breakdown ",[639,3219,3220],{"href":3220,"rel":3221},"https:\u002F\u002Fofox.ai\u002Fblog\u002Fopenrouter-pricing-hidden-markup-breakdown-2026\u002F",[670],[53,3223,3224,3225],{},"DigitalApplied — OpenRouter June 2026 New Models & Pricing Roundup ",[639,3226,3227],{"href":3227,"rel":3228},"https:\u002F\u002Fwww.digitalapplied.com\u002Fblog\u002Fopenrouter-new-models-june-2026-roundup-pricing-rankings",[670],[53,3230,3231,3232],{},"AIToolBox — OpenRouter Review 2026 ",[639,3233,3234],{"href":3234,"rel":3235},"https:\u002F\u002Fwww.aitoolbox.hk\u002Ftools\u002Fopen-router\u002F",[670],{"title":218,"searchDepth":268,"depth":268,"links":3237},[3238,3239,3240,3241,3242,3243,3244,3245,3246,3247],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":2914,"depth":232,"text":2915},{"id":975,"depth":232,"text":975},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},"\u002Fimg\u002Ftools\u002Fopenrouter.webp","OpenRouter 真实评测：AI API 聚合先驱，60+ 厂商 300+ 模型一个 OpenAI 兼容 endpoint。passthrough 定价 0 markup + 5.5% 信用卡平台费（$0.80 最低）+ BYOK 月 100 万请求后 5%。Pay-as-you-go \u002F Team $99\u002F月 SLA \u002F Enterprise。国内直连 1500–3000ms 
高峰超时多。",[3251,3254,3257,3260],{"q":3252,"a":3253},"国内能用吗？","技术上能（OpenAI SDK 改 baseURL），但服务器在海外、无国内节点：实测首 Token 延迟代理 600–1200ms \u002F 直连 1500–3000ms 且不稳，高峰超时率高。AI 编程类高频调用（Cursor \u002F Claude Code \u002F Cline）国内体验糟糕，主流方案是用 OfoxAI \u002F 自建 one-api\u002Fnew-api 中转。",{"q":3255,"a":3256},"真的零 markup 吗？","模型本身按厂商官方价 passthrough，技术上 0 markup。但充值有两层平台费：信用卡 5.5%（最低 $0.80，小额充值实际打到 10–20%）、BYOK 月 100 万请求后 5%。预算时按上层多算 5–7%。",{"q":3258,"a":3259},"自动 fallback 怎么用？","请求里加 `models: ['anthropic\u002Fclaude-sonnet-4.6', 'openai\u002Fgpt-5.4']`，前者失败 \u002F 超时 \u002F 限流时自动切到后者。生产 24h+ 不间断 AI 服务几乎刚需——Anthropic 2026 年 5 月 4 小时宕机，用 fallback 的应用零中断。",{"q":3261,"a":3262},"免费模型怎么用？","模型列表筛选 $0 价（如 Llama 4 Scout \u002F DeepSeek V4 Flash \u002F Qwen3 Coder \u002F Gemma 3）。未充值每日 5 次，充 $5+ 涨到 200 次\u002F日，附带 20 req\u002Fmin。生产别依赖免费模型，限流 \u002F 排队 \u002F 暗切付费会让计费失控。",[728,727],{},[708,1493],[3267,3270,3274,3278],{"plan":2884,"price":743,"features":3268,"notes":3269},"$1 credit + 免费模型 5\u002F日 + 标准限流","不需要信用卡",{"plan":2890,"price":3271,"features":3272,"notes":3273},"Passthrough + 5.5% 卡费","300+ 模型 + 标准限流 + 充 $5 后免费模型 200\u002F日 + BYOK","信用卡平台费最低 $0.80",{"plan":899,"price":3275,"features":3276,"notes":3277},"$99\u002F月","Priority routing + 99.9% SLA + 更高限流","面向生产应用",{"plan":905,"price":1507,"features":3279,"notes":3280},"专属基础设施 + 自定义合同","大规模生产","免费 $1 credit + 5\u002F日 → 200\u002F日（充 $5+） \u002F Pay-as-you-go passthrough + 5.5% 卡费 \u002F Team $99\u002F月 SLA \u002F Enterprise",[3283,3284],{"name":1513,"url":1514},{"name":749,"url":750},{"power":289,"ux":279,"price":279,"cn_support":232,"stability":279},{"title":386,"description":3249},"coding\u002Fapi\u002Fopenrouter",[3289,3291,3293,3295],{"name":3290,"url":3213,"accessed":757},"OfoxAI — OpenRouter 完全指南 2026",{"name":3292,"url":3220,"accessed":757},"OfoxAI — OpenRouter Pricing Hidden Markup",{"name":3294,"url":3227,"accessed":757},"DigitalApplied — OpenRouter June 2026 Roundup",{"name":3296,"url":3234,"accessed":757},"AIToolBox — OpenRouter 
Review 2026","tools\u002Fcoding\u002Fapi\u002Fopenrouter","AI API 聚合先驱——一个 Key + 一个 endpoint 调 300+ 模型，自动 fallback，OpenAI 兼容",[3300,3301,772,2272,3302,2274],"api-gateway","aggregator","multi-model","AI API 聚合的全球事实标准——300+ 模型 \u002F 一个 Key \u002F 自动 fallback。海外开发者首选；国内开发者延迟 1500–3000ms + 不支持支付宝是硬伤，主走 OfoxAI \u002F one-api 自建中转。","https:\u002F\u002Fopenrouter.ai","lBVa44g4os32dXajidARdkCKHABk2aYo8KxAqV2iGfk",{"id":3307,"title":1163,"alternatives":3308,"api_compatible":25,"body":3313,"category":708,"chinese_friendly":232,"cover":4041,"description":4042,"domestic":711,"extension":712,"faq":4043,"free":711,"github":25,"languages":4056,"meta":4057,"models":25,"navigation":312,"notSuitable":25,"opensource":312,"path":21,"pillar":731,"platforms":4058,"priceTable":4059,"pricing":4075,"published":746,"relatedPlaybooks":4076,"relatedReviews":25,"score":4078,"self_host":312,"seo":4079,"slug":4080,"sources":4081,"stem":4089,"suitable":25,"tagline":4090,"tags":4091,"updated":757,"verdict":4096,"website":4097,"__hash__":4098},"tools\u002Ftools\u002Fcoding\u002Fapi\u002Fportkey.md",[3309,3310,3311,3312],{"name":23,"url":24},{"name":14,"url":15},{"name":17,"url":18},{"name":788,"url":730},{"type":27,"value":3314,"toc":4029},[3315,3317,3320,3323,3325,3417,3419,3448,3453,3457,3461,3481,3485,3507,3509,3710,3712,3892,3894,3944,3946,3975,3977,3995,3997,4026],[30,3316,33],{"id":32},[35,3318,3319],{},"Portkey 把 AI 网关（250+ 模型 + fallback + 路由 + 缓存）和 LLM 全栈观测（40+ 维度 + 成本归因 + tracing + auto-instrumentation）做成同一个 SaaS，再加 MCP Gateway 让 AI agent 工具调用可追溯——目标是中大型团队从 PoC 走向生产的『AI 控制面板』。2026 年 Palo Alto Networks 完成收购，附带 SOC2 Type 2 + HIPAA + GDPR + ISO 27001 合规背书。3000+ GenAI 团队使用，1T tokens\u002F天里程碑。",[35,3321,3322],{},"适合：从 PoC 走向生产的中大型团队；要 SOC2\u002FHIPAA\u002FGDPR 强合规；多团队 RBAC + budgets + 治理；大规模 AI agent 部署需要 MCP 工具调用可追溯。不适合：深度 nested span tracing（用 Langfuse）；纯网关不要观测（用 LiteLLM）；中文支付 \u002F 中文 UI（用 one-api \u002F new-api）；预算极紧的小项目（10K log 免费 + Production $49 但深度有限，Helicone 
同档更轻）。",[30,3324,48],{"id":48},[50,3326,3327,3333,3339,3345,3350,3356,3362,3368,3374,3379,3385,3390,3395,3399,3405,3411],{},[53,3328,3329,3332],{},[56,3330,3331],{},"250+ 模型 unified API","：OpenAI \u002F Anthropic \u002F Google \u002F AWS Bedrock \u002F Azure \u002F Cohere \u002F 等",[53,3334,3335,3338],{},[56,3336,3337],{},"Fallback \u002F Load Balancing \u002F Conditional Routing","：跨 provider 高可用",[53,3340,3341,3344],{},[56,3342,3343],{},"Semantic + simple caching","：减延迟 + 降成本",[53,3346,3347,1620],{},[56,3348,3349],{},"Retries \u002F circuit breakers",[53,3351,3352,3355],{},[56,3353,3354],{},"Full-stack Observability","：40+ 维度 logs \u002F traces \u002F metrics",[53,3357,3358,3361],{},[56,3359,3360],{},"OpenTelemetry 兼容","：导出到现有 APM",[53,3363,3364,3367],{},[56,3365,3366],{},"Tracing","：跨 LLM call + tool use 统一时序视图",[53,3369,3370,3373],{},[56,3371,3372],{},"Auto-instrumentation","：自动埋点多个 LLM \u002F agent 框架",[53,3375,3376],{},[56,3377,3378],{},"Prompt management + templates",[53,3380,3381,3384],{},[56,3382,3383],{},"MCP Gateway（GA）","：AI agent 工具调用统一访问 + 审计",[53,3386,3387],{},[56,3388,3389],{},"RBAC + SSO\u002FSAML + Audit",[53,3391,3392],{},[56,3393,3394],{},"Hierarchical budgets + rate limits",[53,3396,3397],{},[56,3398,1640],{},[53,3400,3401,3404],{},[56,3402,3403],{},"Compliance","：SOC2 Type 2 \u002F HIPAA \u002F GDPR \u002F ISO 27001（Enterprise）",[53,3406,3407,3410],{},[56,3408,3409],{},"部署","：SaaS \u002F 私有云 \u002F VPC \u002F on-prem（Enterprise）",[53,3412,3413,3416],{},[56,3414,3415],{},"Open Source Gateway","：MIT 协议，可自托管纯路由层",[30,3418,122],{"id":122},[50,3420,3421,3427,3433,3438,3443],{},[53,3422,3423,3426],{},[56,3424,3425],{},"Developer Free","：10K logs\u002F月 + 3 天 retention + 基础功能",[53,3428,3429,3432],{},[56,3430,3431],{},"Production","：$49\u002F月（早期媒体引用 $79 已下调）+ 100K logs + $9\u002F100K 超量（最高 3M）+ 30 天 retention + 语义缓存 + RBAC + Guardrails",[53,3434,3435,3437],{},[56,3436,899],{},"：联系销售（更高 log 配额 + 团队治理 + 更长 
retention）",[53,3439,3440,3442],{},[56,3441,905],{},"：Custom（业界估 $5K–$10K+\u002F月）+ 10M+ logs + 自定义 retention + 全套合规 + SSO + 私有云",[53,3444,3445,3447],{},[56,3446,3415],{},"：$0 自托管 MIT",[138,3449,3450],{},[35,3451,3452],{},"真实成本陷阱：超过 Production 100K logs 后 $9\u002F100K 累计快，月 1M 请求 ≈ $49 + 9 × 9 ≈ $130。",[30,3454,3456],{"id":3455},"实测中型-saas-series-b-团队","实测（中型 SaaS \u002F Series B 团队）",[35,3458,3459],{},[56,3460,151],{},[50,3462,3463,3466,3469,3472,3475,3478],{},[53,3464,3465],{},"2 分钟改 baseURL 接入，立即看到所有 LLM 调用",[53,3467,3468],{},"40+ 维度 dashboard 让 FinOps 团队第一次能拍预算",[53,3470,3471],{},"conditional routing 让『便宜模型先试 + 失败 fallback 贵模型』容易实现",[53,3473,3474],{},"MCP Gateway 给团队的 agent 工具调用上了治理",[53,3476,3477],{},"SOC 2 Type 2 + HIPAA 让合规过审快",[53,3479,3480],{},"Auto-instrumentation 帮 LangChain \u002F LlamaIndex 应用零代码改造",[35,3482,3483],{},[56,3484,181],{},[50,3486,3487,3490,3493,3496,3499,3501,3504],{},[53,3488,3489],{},"按 recorded logs 计费让用量突增时账单失控",[53,3491,3492],{},"Tracing 深度不如 Langfuse 的 nested span（复杂 agent 调试不够）",[53,3494,3495],{},"模型价格表对部分模型不全 \u002F air-gapped 部署需手动维护",[53,3497,3498],{},"文档对高级配置存在 gap，社区反馈一致",[53,3500,969],{},[53,3502,3503],{},"log retention 30 天上限不动 Enterprise 解决",[53,3505,3506],{},"PANW 收购后路线图 \u002F 定价变动是评估风险",[30,3508,975],{"id":975},[213,3510,3512],{"className":978,"code":3511,"language":980,"meta":218,"style":218},"from portkey_ai import Portkey\n\nclient = Portkey(\n    api_key=\"YOUR_PORTKEY_KEY\",\n    virtual_key=\"OPENAI_VIRTUAL_KEY\",\n    config={\n        \"strategy\": {\"mode\": \"fallback\"},\n        \"targets\": [\n            {\"virtual_key\": \"OPENAI_VK\"},\n            {\"virtual_key\": \"ANTHROPIC_VK\"}\n        ],\n        \"cache\": {\"mode\": \"semantic\"}\n    }\n)\n\nresp = client.chat.completions.create(\n    model=\"gpt-5.4\",\n    messages=[...]\n)\n# Portkey dashboard 自动看到完整 trace + cost + 
latency\n",[39,3513,3514,3527,3531,3540,3551,3563,3572,3591,3599,3614,3628,3633,3649,3653,3657,3661,3671,3683,3699,3704],{"__ignoreMap":218},[222,3515,3516,3519,3522,3524],{"class":224,"line":225},[222,3517,3518],{"class":992},"from",[222,3520,3521],{"class":295}," portkey_ai ",[222,3523,993],{"class":992},[222,3525,3526],{"class":295}," Portkey\n",[222,3528,3529],{"class":224,"line":232},[222,3530,313],{"emptyLinePlaceholder":312},[222,3532,3533,3535,3537],{"class":224,"line":268},[222,3534,1001],{"class":295},[222,3536,1004],{"class":992},[222,3538,3539],{"class":295}," Portkey(\n",[222,3541,3542,3544,3546,3549],{"class":224,"line":279},[222,3543,1026],{"class":1012},[222,3545,1004],{"class":992},[222,3547,3548],{"class":239},"\"YOUR_PORTKEY_KEY\"",[222,3550,1021],{"class":295},[222,3552,3553,3556,3558,3561],{"class":224,"line":289},[222,3554,3555],{"class":1012},"    virtual_key",[222,3557,1004],{"class":992},[222,3559,3560],{"class":239},"\"OPENAI_VIRTUAL_KEY\"",[222,3562,1021],{"class":295},[222,3564,3565,3568,3570],{"class":224,"line":304},[222,3566,3567],{"class":1012},"    config",[222,3569,1004],{"class":992},[222,3571,1043],{"class":295},[222,3573,3574,3577,3580,3583,3585,3588],{"class":224,"line":5},[222,3575,3576],{"class":239},"        \"strategy\"",[222,3578,3579],{"class":295},": {",[222,3581,3582],{"class":239},"\"mode\"",[222,3584,1051],{"class":295},[222,3586,3587],{"class":239},"\"fallback\"",[222,3589,3590],{"class":295},"},\n",[222,3592,3593,3596],{"class":224,"line":8},[222,3594,3595],{"class":239},"        \"targets\"",[222,3597,3598],{"class":295},": [\n",[222,3600,3601,3604,3607,3609,3612],{"class":224,"line":321},[222,3602,3603],{"class":295},"            
{",[222,3605,3606],{"class":239},"\"virtual_key\"",[222,3608,1051],{"class":295},[222,3610,3611],{"class":239},"\"OPENAI_VK\"",[222,3613,3590],{"class":295},[222,3615,3616,3618,3620,3622,3625],{"class":224,"line":7},[222,3617,3603],{"class":295},[222,3619,3606],{"class":239},[222,3621,1051],{"class":295},[222,3623,3624],{"class":239},"\"ANTHROPIC_VK\"",[222,3626,3627],{"class":295},"}\n",[222,3629,3630],{"class":224,"line":332},[222,3631,3632],{"class":295},"        ],\n",[222,3634,3635,3638,3640,3642,3644,3647],{"class":224,"line":338},[222,3636,3637],{"class":239},"        \"cache\"",[222,3639,3579],{"class":295},[222,3641,3582],{"class":239},[222,3643,1051],{"class":295},[222,3645,3646],{"class":239},"\"semantic\"",[222,3648,3627],{"class":295},[222,3650,3651],{"class":224,"line":344},[222,3652,1092],{"class":295},[222,3654,3655],{"class":224,"line":350},[222,3656,1097],{"class":295},[222,3658,3659],{"class":224,"line":356},[222,3660,313],{"emptyLinePlaceholder":312},[222,3662,3663,3666,3668],{"class":224,"line":1889},[222,3664,3665],{"class":295},"resp ",[222,3667,1004],{"class":992},[222,3669,3670],{"class":295}," client.chat.completions.create(\n",[222,3672,3673,3676,3678,3681],{"class":224,"line":1899},[222,3674,3675],{"class":1012},"    model",[222,3677,1004],{"class":992},[222,3679,3680],{"class":239},"\"gpt-5.4\"",[222,3682,1021],{"class":295},[222,3684,3685,3688,3690,3693,3696],{"class":224,"line":1909},[222,3686,3687],{"class":1012},"    messages",[222,3689,1004],{"class":992},[222,3691,3692],{"class":295},"[",[222,3694,3695],{"class":243},"...",[222,3697,3698],{"class":295},"]\n",[222,3700,3702],{"class":224,"line":3701},19,[222,3703,1097],{"class":295},[222,3705,3707],{"class":224,"line":3706},20,[222,3708,3709],{"class":228},"# Portkey dashboard 自动看到完整 trace + cost + 
latency\n",[30,3711,362],{"id":362},[364,3713,3714,3728],{},[367,3715,3716],{},[370,3717,3718,3720,3722,3724,3726],{},[373,3719,375],{},[373,3721,1163],{},[373,3723,782],{},[373,3725,1160],{},[373,3727,383],{},[388,3729,3730,3746,3762,3775,3787,3802,3817,3831,3846,3861,3876],{},[370,3731,3732,3734,3737,3740,3743],{},[393,3733,1939],{},[393,3735,3736],{},"Gateway+Obs SaaS",[393,3738,3739],{},"Proxy Obs",[393,3741,3742],{},"SDK Tracing",[393,3744,3745],{},"OSS Gateway",[370,3747,3748,3751,3754,3756,3759],{},[393,3749,3750],{},"集成",[393,3752,3753],{},"改 baseURL（分钟）",[393,3755,3753],{},[393,3757,3758],{},"代码改造（小时）",[393,3760,3761],{},"自托管（小时）",[370,3763,3764,3766,3768,3771,3773],{},[393,3765,1197],{},[393,3767,1206],{},[393,3769,3770],{},"浅",[393,3772,1203],{},[393,3774,406],{},[370,3776,3777,3779,3781,3783,3785],{},[393,3778,1211],{},[393,3780,1219],{},[393,3782,414],{},[393,3784,414],{},[393,3786,417],{},[370,3788,3789,3792,3795,3798,3800],{},[393,3790,3791],{},"Auto fallback",[393,3793,3794],{},"✅ chains",[393,3796,3797],{},"✅ 基础",[393,3799,414],{},[393,3801,417],{},[370,3803,3804,3807,3809,3812,3814],{},[393,3805,3806],{},"Semantic caching",[393,3808,417],{},[393,3810,3811],{},"proxy 级",[393,3813,414],{},[393,3815,3816],{},"Redis",[370,3818,3819,3822,3825,3827,3829],{},[393,3820,3821],{},"MCP Gateway",[393,3823,3824],{},"✅ GA",[393,3826,414],{},[393,3828,414],{},[393,3830,414],{},[370,3832,3833,3835,3838,3841,3844],{},[393,3834,865],{},[393,3836,3837],{},"Enterprise \u002F OSS Gateway",[393,3839,3840],{},"Enterprise（已收购）",[393,3842,3843],{},"✅ 免费无限",[393,3845,417],{},[370,3847,3848,3850,3853,3856,3859],{},[393,3849,871],{},[393,3851,3852],{},"SOC2 + HIPAA + GDPR + ISO27001",[393,3854,3855],{},"SOC2 + 
HIPAA",[393,3857,3858],{},"SOC2",[393,3860,417],{},[370,3862,3863,3866,3869,3871,3874],{},[393,3864,3865],{},"起价",[393,3867,3868],{},"$49\u002F月",[393,3870,1499],{},[393,3872,3873],{},"$29\u002F月",[393,3875,743],{},[370,3877,3878,3881,3884,3887,3890],{},[393,3879,3880],{},"免费配额",[393,3882,3883],{},"10K logs",[393,3885,3886],{},"10K req",[393,3888,3889],{},"50K events",[393,3891,406],{},[30,3893,542],{"id":542},[50,3895,3896,3902,3908,3914,3920,3926,3932,3938],{},[53,3897,3898,3901],{},[56,3899,3900],{},"按 logs 计费要设报警","：超量 $9\u002F100K 容易爆账单",[53,3903,3904,3907],{},[56,3905,3906],{},"PANW 收购变量","：评估时把定价 \u002F 路线图 \u002F API 变动写进风险",[53,3909,3910,3913],{},[56,3911,3912],{},"Tracing 不深够用就好","：复杂 agent 调试要叠 Langfuse",[53,3915,3916,3919],{},[56,3917,3918],{},"Production tier retention 30 天","：超长归档要 Enterprise",[53,3921,3922,3925],{},[56,3923,3924],{},"Air-gapped 价格表","：部分模型成本要手动维护",[53,3927,3928,3931],{},[56,3929,3930],{},"Virtual Key 别裸暴露","：客户端调用务必走 server-side proxy",[53,3933,3934,3937],{},[56,3935,3936],{},"Conditional routing 别写太复杂","：3+ 层条件路由调试痛苦",[53,3939,3940,3943],{},[56,3941,3942],{},"Open Source Gateway != 企业版","：自托管开源版缺 governance \u002F dashboards \u002F evals",[30,3945,601],{"id":600},[50,3947,3948,3951,3954,3957,3960,3963,3966,3969,3972],{},[53,3949,3950],{},"✅ 中大型团队从 PoC 走向生产",[53,3952,3953],{},"✅ 强合规（SOC2 Type 2 + HIPAA + GDPR + ISO27001）",[53,3955,3956],{},"✅ 多团队 RBAC + 预算治理",[53,3958,3959],{},"✅ 大规模 AI agent 部署 + MCP 工具治理",[53,3961,3962],{},"✅ 想要『网关 + 观测』一体化 SaaS",[53,3964,3965],{},"❌ 深度 nested span 调试（用 Langfuse）",[53,3967,3968],{},"❌ 纯网关不要观测（用 LiteLLM）",[53,3970,3971],{},"❌ 中文运营 \u002F 中文支付（用 one-api \u002F new-api）",[53,3973,3974],{},"❌ 极小预算项目（Helicone Hobby \u002F Langfuse Free 
更划算）",[30,3976,633],{"id":633},[50,3978,3979,3983,3987,3991],{},[53,3980,3981],{},[639,3982,656],{"href":24},[53,3984,3985],{},[639,3986,641],{"href":15},[53,3988,3989],{},[639,3990,646],{"href":18},[53,3992,3993],{},[639,3994,1419],{"href":730},[30,3996,659],{"id":659},[661,3998,3999,4006,4013,4019],{},[53,4000,4001,4002],{},"Portkey 官网 — Observability 全栈观测 + Palo Alto Networks 收购公告 ",[639,4003,4004],{"href":4004,"rel":4005},"https:\u002F\u002Fportkey.ai\u002Ffeatures\u002Fobservability",[670],[53,4007,4008,4009],{},"TrueFoundry — Portkey AI Gateway Pricing Guide 2026 ",[639,4010,4011],{"href":4011,"rel":4012},"https:\u002F\u002Fwww.truefoundry.com\u002Fblog\u002Fportkey-pricing-guide",[670],[53,4014,4015,4016],{},"BuildMVPFast — Langfuse vs Helicone vs Portkey 对比 ",[639,4017,1457],{"href":1457,"rel":4018},[670],[53,4020,4021,4022],{},"DevTune — Portkey AI 评测 + 定价 + Gartner Cool Vendor ",[639,4023,4024],{"href":4024,"rel":4025},"https:\u002F\u002Fdevtune.ai\u002Fverticals\u002Fllm-observability-evals-gateways\u002Fportkey",[670],[693,4027,4028],{},"html pre.shiki code .szBVR, html code.shiki .szBVR{--shiki-default:#D73A49;--shiki-dark:#F97583}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .s4XuR, html code.shiki .s4XuR{--shiki-default:#E36209;--shiki-dark:#FFAB70}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .sJ8bj, html code.shiki .sJ8bj{--shiki-default:#6A737D;--shiki-dark:#6A737D}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: 
var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":218,"searchDepth":268,"depth":268,"links":4030},[4031,4032,4033,4034,4035,4036,4037,4038,4039,4040],{"id":32,"depth":232,"text":33},{"id":48,"depth":232,"text":48},{"id":122,"depth":232,"text":122},{"id":3455,"depth":232,"text":3456},{"id":975,"depth":232,"text":975},{"id":362,"depth":232,"text":362},{"id":542,"depth":232,"text":542},{"id":600,"depth":232,"text":601},{"id":633,"depth":232,"text":633},{"id":659,"depth":232,"text":659},"\u002Fimg\u002Ftools\u002Fportkey.webp","Portkey 真实评测：250+ 模型统一 AI 网关 + 全栈观测 + MCP Gateway。2026 被 Palo Alto Networks 收购。免费 10K logs\u002F月，Production $49\u002F月（100K logs + 30 天 retention），Team 大体量，Enterprise SOC2 Type 2 + HIPAA + GDPR + ISO 27001 + 私有云 \u002F VPC + 1T tokens\u002F天里程碑。",[4044,4047,4050,4053],{"q":4045,"a":4046},"Portkey 收购了？","2026 年 Palo Alto Networks 完成收购 Portkey，作为其『保护 AI agent 崛起』战略的一部分。产品继续运营 + 1T tokens\u002F天里程碑达成；对企业买家是利好（背靠 Palo Alto 安全 + 合规背书），但社区担忧定价 \u002F 路线图变化——评估时要把『被 PANW 整合』作为风险项。",{"q":4048,"a":4049},"Recorded logs 是什么计量？","Portkey 不按请求 \u002F token 计费，而是按『记录到观测系统的日志条数』。一次 API 调用 = 一条 log（不含 retries）。100K logs 是『被采集 100K 次请求』的容量，不是『LLM 100K 调用配额』——LLM 费用走你自己付。",{"q":4051,"a":4052},"自托管选项？","Portkey 开源了核心 AI Gateway（GitHub Star 10K+，MIT），可以自托管做纯路由 + 基础观测；但企业级功能（SOC2 \u002F 自动 evals \u002F 团队治理 \u002F governance dashboard）只在 SaaS 或 Enterprise on-prem 提供。",{"q":4054,"a":4055},"MCP Gateway 是什么？","面向 AI agent 的 MCP（Model Context 
Protocol）统一访问层，已 GA。每次 agent 调工具都自动记录工具名 \u002F 参数 \u002F 响应 \u002F 用户 \u002F 团队 \u002F 延迟 \u002F 状态，是大规模 agent 部署里『谁的 agent 在做什么』可追溯的关键基础设施。",[728],{},[1492,708,1493],[4060,4064,4067,4071],{"plan":4061,"price":743,"features":4062,"notes":4063},"Developer","10K recorded logs\u002F月 + 3 天 retention + 社区支持 + 基础 fallback","PoC \u002F hobby \u002F 小项目",{"plan":3431,"price":3868,"features":4065,"notes":4066},"100K logs\u002F月 + $9\u002F100K 超量（最高 3M）+ 30 天 retention + 语义缓存 + RBAC + Guardrails + 生产支持","中小生产应用",{"plan":899,"price":4068,"features":4069,"notes":4070},"联系销售","更高 log 配额 + 团队治理 + 更长 retention","中型组织",{"plan":905,"price":4072,"features":4073,"notes":4074},"Custom（$5K–$10K+\u002F月）","10M+ logs + 自定义 retention + SSO\u002FSAML + 私有云\u002FVPC + SOC2 Type 2 + HIPAA + GDPR + ISO 27001 + 单租户","大企业 \u002F 强合规","Developer 免费 10K logs\u002F月 \u002F Production $49\u002F月 100K logs \u002F Team 大体量 \u002F Enterprise 定制",[4077],{"name":1513,"url":1514},{"power":289,"ux":279,"price":268,"cn_support":232,"stability":279},{"title":1163,"description":4042},"coding\u002Fapi\u002Fportkey",[4082,4084,4086,4087],{"name":4083,"url":4004,"accessed":757},"Portkey 官网 — Observability 功能",{"name":4085,"url":4011,"accessed":757},"TrueFoundry — Portkey Pricing Guide 2026",{"name":1528,"url":1457,"accessed":757},{"name":4088,"url":4024,"accessed":757},"DevTune — Portkey AI 评测 + 定价","tools\u002Fcoding\u002Fapi\u002Fportkey","Control Panel for Production AI——AI 网关 + 全栈观测 + MCP 网关，2026 被 Palo Alto Networks 收购",[767,4092,4093,4094,4095,1536,1537],"observability","mcp","governance","enterprise","网关 + 观测一体化最完整的 SaaS。中大型团队从 PoC 走向生产、要 SOC2\u002FHIPAA\u002FMCP\u002F治理走 Portkey。纯观测 → Helicone\u002FLangfuse；自托管控制成本 → LiteLLM + Langfuse。","https:\u002F\u002Fportkey.ai","Cn9cCfSk0-CNbWtnHGWslh2DNePBYyh3ddM9rA7GWRk",[],1782316490479]