[{"data":1,"prerenderedAt":941},["ShallowReactive",2],{"header-counts":3,"footer-counts":6,"model-claude-haiku-4":9},{"tools":4,"reviews":5},65,7,{"tools":4,"reviews":5,"playbooks":7,"news":8},10,8,{"id":10,"title":11,"apiCompatible":12,"benchmarks":14,"body":24,"category":907,"contextWindow":908,"description":909,"extension":910,"maxOutput":911,"meta":912,"navigation":179,"path":913,"pricing":914,"published":915,"relatedTools":916,"releaseDate":919,"seo":920,"slug":921,"stem":922,"strengths":923,"updated":915,"useCases":929,"vendor":934,"vendorEn":934,"weaknesses":935,"__hash__":940},"models\u002Fmodels\u002Fclaude-haiku-4.md","Claude Haiku 4",[13],"anthropic",[15,18,21],{"name":16,"score":17},"SWE-bench Verified","56.1%",{"name":19,"score":20},"HumanEval","87.1%",{"name":22,"score":23},"MMLU","83.4%",{"type":25,"value":26,"toc":888},"minimark",[27,31,35,38,42,45,48,104,107,110,114,117,121,129,133,306,310,313,487,490,493,564,567,583,587,590,604,607,611,693,700,703,782,786,789,806,809,823,826,852,855,884],[28,29,30],"h2",{"id":30},"概述",[32,33,34],"p",{},"Claude Haiku 4 是 Anthropic 于 2025 年 5 月与 Sonnet 4 \u002F Opus 4 同步发布的轻量模型。定位为\"快速 + 低成本\"选项，速度是 Sonnet 4 的 3 倍，价格仅 1\u002F3。",[28,36,37],{"id":37},"核心能力",[39,40,41],"h3",{"id":41},"极速响应",[32,43,44],{},"Haiku 4 的首 token 延迟约 0.5 秒，是 Sonnet 4 的 1\u002F3。对于实时代码补全、流式聊天等场景，这个速度差异至关重要。",[32,46,47],{},"实测吞吐：",[49,50,51,67],"table",{},[52,53,54],"thead",{},[55,56,57,61,64],"tr",{},[58,59,60],"th",{},"场景",[58,62,63],{},"Haiku 4",[58,65,66],{},"Sonnet 4",[68,69,70,82,93],"tbody",{},[55,71,72,76,79],{},[73,74,75],"td",{},"首 token 延迟",[73,77,78],{},"~0.5s",[73,80,81],{},"~1.5s",[55,83,84,87,90],{},[73,85,86],{},"流式吞吐",[73,88,89],{},"~80 tok\u002Fs",[73,91,92],{},"~50 tok\u002Fs",[55,94,95,98,101],{},[73,96,97],{},"1K 字回答总时长",[73,99,100],{},"~2s",[73,102,103],{},"~6s",[39,105,106],{"id":106},"编程能力不打折",[32,108,109],{},"SWE-bench Verified 56.1%，远超同价位的 GPT-4o-mini（33.2%）和 Gemini Flash（43.8%）。在代码补全场景下，Haiku 4 的体验接近 Sonnet 4 的 80%。",[39,111,113],{"id":112},"_200k-上下文","200K 上下文",[32,115,116],{},"与 Sonnet 4 共享 200K 上下文窗口。可以用低成本处理长文档、全文件分析等任务。",[39,118,120],{"id":119},"prompt-cache-仍然支持","Prompt Cache 仍然支持",[32,122,123,124,128],{},"Haiku 4 同样支持 prompt cache，Cache Read 价格只有 $0.10\u002FM——便宜到几乎可以忽略。",[125,126,127],"strong",{},"高频固定 prompt 场景务必开启","。",[28,130,132],{"id":131},"api-调用示例","API 调用示例",[134,135,140],"pre",{"className":136,"code":137,"language":138,"meta":139,"style":139},"language-python shiki shiki-themes github-light github-dark","from anthropic import Anthropic\nclient = Anthropic()\n\n# 极致速度场景：流式 + 短 max_tokens\nwith client.messages.stream(\n    model=\"claude-haiku-4-20250522\",\n    max_tokens=500,           # 不要默认 16K，限制输出长度提速\n    temperature=0,\n    messages=[{\"role\": \"user\", \"content\": prompt}],\n) as stream:\n    for text in stream.text_stream:\n        yield text\n","python","",[141,142,143,162,174,181,188,197,213,230,242,271,282,297],"code",{"__ignoreMap":139},[144,145,148,152,156,159],"span",{"class":146,"line":147},"line",1,[144,149,151],{"class":150},"szBVR","from",[144,153,155],{"class":154},"sVt8B"," anthropic ",[144,157,158],{"class":150},"import",[144,160,161],{"class":154}," Anthropic\n",[144,163,165,168,171],{"class":146,"line":164},2,[144,166,167],{"class":154},"client ",[144,169,170],{"class":150},"=",[144,172,173],{"class":154}," Anthropic()\n",[144,175,177],{"class":146,"line":176},3,[144,178,180],{"emptyLinePlaceholder":179},true,"\n",[144,182,184],{"class":146,"line":183},4,[144,185,187],{"class":186},"sJ8bj","# 极致速度场景：流式 + 短 max_tokens\n",[144,189,191,194],{"class":146,"line":190},5,[144,192,193],{"class":150},"with",[144,195,196],{"class":154}," client.messages.stream(\n",[144,198,200,204,206,210],{"class":146,"line":199},6,[144,201,203],{"class":202},"s4XuR","    model",[144,205,170],{"class":150},[144,207,209],{"class":208},"sZZnC","\"claude-haiku-4-20250522\"",[144,211,212],{"class":154},",\n",[144,214,215,218,220,224,227],{"class":146,"line":5},[144,216,217],{"class":202},"    max_tokens",[144,219,170],{"class":150},[144,221,223],{"class":222},"sj4cs","500",[144,225,226],{"class":154},",           ",[144,228,229],{"class":186},"# 不要默认 16K，限制输出长度提速\n",[144,231,232,235,237,240],{"class":146,"line":8},[144,233,234],{"class":202},"    temperature",[144,236,170],{"class":150},[144,238,239],{"class":222},"0",[144,241,212],{"class":154},[144,243,245,248,250,253,256,259,262,265,268],{"class":146,"line":244},9,[144,246,247],{"class":202},"    messages",[144,249,170],{"class":150},[144,251,252],{"class":154},"[{",[144,254,255],{"class":208},"\"role\"",[144,257,258],{"class":154},": ",[144,260,261],{"class":208},"\"user\"",[144,263,264],{"class":154},", ",[144,266,267],{"class":208},"\"content\"",[144,269,270],{"class":154},": prompt}],\n",[144,272,273,276,279],{"class":146,"line":7},[144,274,275],{"class":154},") ",[144,277,278],{"class":150},"as",[144,280,281],{"class":154}," stream:\n",[144,283,285,288,291,294],{"class":146,"line":284},11,[144,286,287],{"class":150},"    for",[144,289,290],{"class":154}," text ",[144,292,293],{"class":150},"in",[144,295,296],{"class":154}," stream.text_stream:\n",[144,298,300,303],{"class":146,"line":299},12,[144,301,302],{"class":150},"        yield",[144,304,305],{"class":154}," text\n",[39,307,309],{"id":308},"批量处理batch-api","批量处理（Batch API）",[32,311,312],{},"Haiku 4 配合 Anthropic Batch API，价格再 -50%（变成 Input $0.5\u002FM · Output $2.5\u002FM），24 小时内返回。适合：",[134,314,316],{"className":136,"code":315,"language":138,"meta":139,"style":139},"# 提交 10000 条要分类的文本\nbatch = client.messages.batches.create(\n    requests=[\n        {\n            \"custom_id\": f\"task-{i}\",\n            \"params\": {\n                \"model\": \"claude-haiku-4-20250522\",\n                \"max_tokens\": 100,\n                \"messages\": [{\"role\": \"user\", \"content\": f\"分类：{text}\"}],\n            }\n        }\n        for i, text in enumerate(texts)\n    ]\n)\n# 轮询 batch.id 直到 status='ended'\n",[141,317,318,323,333,343,348,375,383,394,406,443,448,453,469,475,481],{"__ignoreMap":139},[144,319,320],{"class":146,"line":147},[144,321,322],{"class":186},"# 提交 10000 条要分类的文本\n",[144,324,325,328,330],{"class":146,"line":164},[144,326,327],{"class":154},"batch ",[144,329,170],{"class":150},[144,331,332],{"class":154}," client.messages.batches.create(\n",[144,334,335,338,340],{"class":146,"line":176},[144,336,337],{"class":202},"    requests",[144,339,170],{"class":150},[144,341,342],{"class":154},"[\n",[144,344,345],{"class":146,"line":183},[144,346,347],{"class":154},"        {\n",[144,349,350,353,355,358,361,364,367,370,373],{"class":146,"line":190},[144,351,352],{"class":208},"            \"custom_id\"",[144,354,258],{"class":154},[144,356,357],{"class":150},"f",[144,359,360],{"class":208},"\"task-",[144,362,363],{"class":222},"{",[144,365,366],{"class":154},"i",[144,368,369],{"class":222},"}",[144,371,372],{"class":208},"\"",[144,374,212],{"class":154},[144,376,377,380],{"class":146,"line":199},[144,378,379],{"class":208},"            \"params\"",[144,381,382],{"class":154},": {\n",[144,384,385,388,390,392],{"class":146,"line":5},[144,386,387],{"class":208},"                \"model\"",[144,389,258],{"class":154},[144,391,209],{"class":208},[144,393,212],{"class":154},[144,395,396,399,401,404],{"class":146,"line":8},[144,397,398],{"class":208},"                \"max_tokens\"",[144,400,258],{"class":154},[144,402,403],{"class":222},"100",[144,405,212],{"class":154},[144,407,408,411,414,416,418,420,422,424,426,428,431,433,436,438,440],{"class":146,"line":244},[144,409,410],{"class":208},"                \"messages\"",[144,412,413],{"class":154},": [{",[144,415,255],{"class":208},[144,417,258],{"class":154},[144,419,261],{"class":208},[144,421,264],{"class":154},[144,423,267],{"class":208},[144,425,258],{"class":154},[144,427,357],{"class":150},[144,429,430],{"class":208},"\"分类：",[144,432,363],{"class":222},[144,434,435],{"class":154},"text",[144,437,369],{"class":222},[144,439,372],{"class":208},[144,441,442],{"class":154},"}],\n",[144,444,445],{"class":146,"line":7},[144,446,447],{"class":154},"            }\n",[144,449,450],{"class":146,"line":284},[144,451,452],{"class":154},"        }\n",[144,454,455,458,461,463,466],{"class":146,"line":299},[144,456,457],{"class":150},"        for",[144,459,460],{"class":154}," i, text ",[144,462,293],{"class":150},[144,464,465],{"class":222}," enumerate",[144,467,468],{"class":154},"(texts)\n",[144,470,472],{"class":146,"line":471},13,[144,473,474],{"class":154},"    ]\n",[144,476,478],{"class":146,"line":477},14,[144,479,480],{"class":154},")\n",[144,482,484],{"class":146,"line":483},15,[144,485,486],{"class":186},"# 轮询 batch.id 直到 status='ended'\n",[32,488,489],{},"万级任务用 Batch 一晚就出，成本是单条同步调用的 1\u002F2。",[28,491,492],{"id":492},"定价",[49,494,495,509],{},[52,496,497],{},[55,498,499,502,504,506],{},[58,500,501],{},"项目",[58,503,63],{},[58,505,66],{},[58,507,508],{},"倍数",[68,510,511,525,538,551],{},[55,512,513,516,519,522],{},[73,514,515],{},"Input",[73,517,518],{},"$1\u002FM",[73,520,521],{},"$3\u002FM",[73,523,524],{},"3×",[55,526,527,530,533,536],{},[73,528,529],{},"Output",[73,531,532],{},"$5\u002FM",[73,534,535],{},"$15\u002FM",[73,537,524],{},[55,539,540,543,546,549],{},[73,541,542],{},"Cache Read",[73,544,545],{},"$0.10\u002FM",[73,547,548],{},"$0.30\u002FM",[73,550,524],{},[55,552,553,556,559,562],{},[73,554,555],{},"Batch（-50%）",[73,557,558],{},"$0.5\u002F$2.5",[73,560,561],{},"$1.5\u002F$7.5",[73,563,524],{},[32,565,566],{},"一个月用 10 亿 token（Input\u002FOutput 各半）：",[568,569,570,574,577,580],"ul",{},[571,572,573],"li",{},"Sonnet 4: $9,000",[571,575,576],{},"Haiku 4: $3,000",[571,578,579],{},"Haiku 4 + 50% cache: $1,650",[571,581,582],{},"Haiku 4 + Batch: $1,500",[28,584,586],{"id":585},"在-cursor-ide-中的角色","在 Cursor \u002F IDE 中的角色",[32,588,589],{},"Cursor \u002F Windsurf 等 IDE 内部通常分两档模型：",[568,591,592,598],{},[571,593,594,597],{},[125,595,596],{},"Tab 自动补全 \u002F Cmd+K 小改动"," → 用 Haiku 4 这类速度优先模型",[571,599,600,603],{},[125,601,602],{},"Composer 多文件改写 \u002F Agent"," → 用 Sonnet 4 这类质量优先模型",[32,605,606],{},"如果你自建 IDE 集成，参考这个分层。",[28,608,610],{"id":609},"haiku-4-vs-同价位竞品","Haiku 4 vs 同价位竞品",[49,612,613,630],{},[52,614,615],{},[55,616,617,620,622,624,627],{},[58,618,619],{},"模型",[58,621,515],{},[58,623,529],{},[58,625,626],{},"SWE-bench",[58,628,629],{},"速度",[68,631,632,645,661,676],{},[55,633,634,636,638,640,642],{},[73,635,11],{},[73,637,518],{},[73,639,532],{},[73,641,17],{},[73,643,644],{},"★★★★★",[55,646,647,650,653,656,659],{},[73,648,649],{},"GPT-4o-mini",[73,651,652],{},"$0.15\u002FM",[73,654,655],{},"$0.60\u002FM",[73,657,658],{},"33.2%",[73,660,644],{},[55,662,663,666,669,671,674],{},[73,664,665],{},"Gemini 2.5 Flash",[73,667,668],{},"$0.075\u002FM",[73,670,548],{},[73,672,673],{},"43.8%",[73,675,644],{},[55,677,678,681,684,687,690],{},[73,679,680],{},"DeepSeek-V3",[73,682,683],{},"¥1\u002FM",[73,685,686],{},"¥2\u002FM",[73,688,689],{},"61.2%",[73,691,692],{},"★★★★☆",[32,694,695,696,699],{},"GPT-4o-mini \u002F Gemini Flash 便宜 5-10 倍，但 SWE-bench 差一大截。",[125,697,698],{},"Haiku 4 是\"轻量级里编程最强\"","，DeepSeek-V3 是\"国内便宜里编程最强\"。",[28,701,702],{"id":702},"三档模型怎么选",[49,704,705,717],{},[52,706,707],{},[55,708,709,711,714],{},[58,710,60],{},[58,712,713],{},"推荐",[58,715,716],{},"理由",[68,718,719,729,739,750,761,771],{},[55,720,721,724,726],{},[73,722,723],{},"代码补全\u002F实时建议",[73,725,63],{},[73,727,728],{},"速度优先",[55,730,731,734,736],{},[73,732,733],{},"主力编程\u002F代码审查",[73,735,66],{},[73,737,738],{},"质量优先",[55,740,741,744,747],{},[73,742,743],{},"深度推理\u002F长文写作",[73,745,746],{},"Opus 4",[73,748,749],{},"能力优先",[55,751,752,755,758],{},[73,753,754],{},"批量处理 10 万条数据",[73,756,757],{},"Haiku 4 + Batch",[73,759,760],{},"成本优先",[55,762,763,766,768],{},[73,764,765],{},"Agent 多步工具调用",[73,767,66],{},[73,769,770],{},"稳定性优先",[55,772,773,776,779],{},[73,774,775],{},"国内项目预算敏感",[73,777,778],{},"GLM-5.2 \u002F DeepSeek-V3",[73,780,781],{},"直连且更便宜",[28,783,785],{"id":784},"适用-不适用清单","适用 \u002F 不适用清单",[32,787,788],{},"✅ 适合：",[568,790,791,794,797,800,803],{},[571,792,793],{},"代码自动补全（Cursor Tab \u002F Copilot 风格）",[571,795,796],{},"实时聊天机器人 \u002F 客服",[571,798,799],{},"大批量分类 \u002F 抽取 \u002F 摘要",[571,801,802],{},"工具调用前置的简单 router 模型",[571,804,805],{},"日志解析 \u002F 语义提取",[32,807,808],{},"❌ 不适合：",[568,810,811,814,817,820],{},[571,812,813],{},"复杂多步推理（用 Sonnet 4 \u002F Opus 4）",[571,815,816],{},"多文件代码重构（用 Sonnet 4）",[571,818,819],{},"长文写作（16K 输出窗口不够）",[571,821,822],{},"法律 \u002F 医疗 \u002F 金融的严格场景（用 Opus 4）",[28,824,825],{"id":825},"避坑清单",[568,827,828,834,840,846],{},[571,829,830,833],{},[125,831,832],{},"别忘 max_tokens","：不显式设的话默认值很大，浪费速度和钱。",[571,835,836,839],{},[125,837,838],{},"16K 输出限制","：长文档处理时让模型分段输出。",[571,841,842,845],{},[125,843,844],{},"Cache 也要开","：哪怕 Haiku 已经很便宜，固定 prompt 部分 cache 后又能再省 50%。",[571,847,848,851],{},[125,849,850],{},"复杂任务不要硬凑","：模型选错宁可重路由也别让 Haiku 4 硬扛——你省的钱会在用户体验上还回去。",[28,853,854],{"id":854},"延伸阅读",[568,856,857,870,877],{},[571,858,859,860,865,866],{},"同系兄弟：",[861,862,864],"a",{"href":863},"\u002Fmodels\u002Fclaude-sonnet-4.html","Claude Sonnet 4"," \u002F ",[861,867,869],{"href":868},"\u002Fmodels\u002Fclaude-opus-4.html","Claude Opus 4",[571,871,872,873],{},"省钱原理：",[861,874,876],{"href":875},"\u002Fwiki\u002Ftoken.html","Token",[571,878,879,880],{},"速度优化：",[861,881,883],{"href":882},"\u002Fwiki\u002Fcontext-engineering.html","Context Engineering",[885,886,887],"style",{},"html pre.shiki code .szBVR, html code.shiki .szBVR{--shiki-default:#D73A49;--shiki-dark:#F97583}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sJ8bj, html code.shiki .sJ8bj{--shiki-default:#6A737D;--shiki-dark:#6A737D}html pre.shiki code .s4XuR, html code.shiki .s4XuR{--shiki-default:#E36209;--shiki-dark:#FFAB70}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":139,"searchDepth":176,"depth":176,"links":889},[890,891,897,900,901,902,903,904,905,906],{"id":30,"depth":164,"text":30},{"id":37,"depth":164,"text":37,"children":892},[893,894,895,896],{"id":41,"depth":176,"text":41},{"id":106,"depth":176,"text":106},{"id":112,"depth":176,"text":113},{"id":119,"depth":176,"text":120},{"id":131,"depth":164,"text":132,"children":898},[899],{"id":308,"depth":176,"text":309},{"id":492,"depth":164,"text":492},{"id":585,"depth":164,"text":586},{"id":609,"depth":164,"text":610},{"id":702,"depth":164,"text":702},{"id":784,"depth":164,"text":785},{"id":825,"depth":164,"text":825},{"id":854,"depth":164,"text":854},"llm",200000,"Anthropic Claude Haiku 4 轻量快速模型，价格为 Sonnet 4 的 1\u002F3、推理速度约 3 倍，工具调用与指令跟随保持 Claude 家族水准，适合代码补全、IDE 实时辅助、批量处理与高并发 Agent 场景。","md",16384,{},"\u002Fmodels\u002Fclaude-haiku-4","Input $1\u002FM · Output $5\u002FM","2026-06-21",[917,918],"coding\u002Fide\u002Fcursor","coding\u002Fcli\u002Fclaude-code","2025-05-22",{"title":11,"description":909},"claude-haiku-4","models\u002Fclaude-haiku-4",[924,925,926,927,928],"速度极快，3 倍于 Sonnet 4","价格仅为 Sonnet 4 的 1\u002F3","200K 上下文，与 Sonnet 4 一致","编程能力远超同价位竞品","适合高并发、低延迟场景",[930,931,932,933],"代码补全（实时建议）","高并发客服 Bot","批量文本处理","轻量 Agent 任务","Anthropic",[936,937,938,939],"推理能力不如 Sonnet 4 \u002F Opus 4","复杂编程任务不如 Sonnet 4 稳定","16K 输出窗口偏短","国内无官方 API","-CLLhOK8SfSERewWRln2xOJCJJ7chSXi4gXInERf4pU",1782316489329]