[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"pack-detail-translator-multilingual-stack-zh":3,"seo:pack:translator-multilingual-stack:zh":92},{"code":4,"message":5,"data":6},200,"操作成功",{"pack":7},{"slug":8,"icon":9,"tone":10,"status":11,"status_label":12,"title":13,"description":14,"items":15,"install_cmd":91},"translator-multilingual-stack","🌐","#0891B2","new","本周新建","译者的多语种栈","十个资产给真正在跑流水线的本地化工程师、译者和 i18n PM：抽取 → 术语表 → 翻译（LLM + NMT）→ 术语 QA → 回注。自托管 Weblate\u002FTolgee，LibreTranslate 兜底，Vale + LanguageTool 做 QA，PDFMathTranslate 和 KrillinAI 啃硬格式。",[16,28,35,41,49,56,63,70,77,84],{"id":17,"uuid":18,"slug":19,"title":20,"description":21,"author_name":22,"view_count":23,"vote_count":24,"lang_type":25,"type":26,"type_label":27},1776,"cb2ceff8-3bca-11f1-9bc6-00163e2b0d79","weblate-web-based-continuous-localization-platform-cb2ceff8","Weblate — Web-Based Continuous Localization Platform","A web-based translation management system with tight version control integration. Weblate automates the localization workflow with translation memory, machine translation, and quality checks.","AI Open Source",120,0,"en","skill","Skill",{"id":29,"uuid":30,"slug":31,"title":32,"description":33,"author_name":22,"view_count":34,"vote_count":24,"lang_type":25,"type":26,"type_label":27},2716,"5b96a366-48e2-11f1-9bc6-00163e2b0d79","tolgee-developer-friendly-localization-platform-5b96a366","Tolgee — Developer-Friendly Localization Platform","An open-source localization platform that lets developers and translators manage translations through a web UI, in-context editing, and native SDK integrations for React, Vue, Angular, and more.",105,{"id":36,"uuid":37,"slug":38,"title":39,"description":40,"author_name":22,"view_count":4,"vote_count":24,"lang_type":25,"type":26,"type_label":27},1336,"3109a712-381e-11f1-9bc6-00163e2b0d79","libretranslate-self-hosted-translation-api-no-rate-limits-3109a712","LibreTranslate — Self-Hosted Translation API with No Rate Limits","LibreTranslate is a 
self-hostable translation API powered by open-source Argos Translate models. No API keys, no rate limits, no data sent to third parties — a drop-in replacement for Google Translate when privacy matters.",{"id":42,"uuid":43,"slug":44,"title":45,"description":46,"author_name":47,"view_count":48,"vote_count":24,"lang_type":25,"type":26,"type_label":27},389,"4c628f43-c803-45c8-ae39-a4caded80419","pdfmathtranslate-translate-pdf-papers-preserving-format-4c628f43","PDFMathTranslate — Translate PDF Papers Preserving Format","Translate PDF scientific papers while preserving math formulas, charts, and layout. Supports Google, DeepL, OpenAI, Ollama. CLI, GUI, MCP, Docker, Zotero plugin.","Script Depot",234,{"id":50,"uuid":51,"slug":52,"title":53,"description":54,"author_name":47,"view_count":55,"vote_count":24,"lang_type":25,"type":26,"type_label":27},2354,"834cabb9-43c5-11f1-9bc6-00163e2b0d79","fairseq-sequence-modeling-toolkit-meta-834cabb9","Fairseq — Sequence Modeling Toolkit by Meta","Facebook AI Research sequence modeling toolkit for training custom models in translation, summarization, language modeling, and other text generation tasks.",119,{"id":57,"uuid":58,"slug":59,"title":60,"description":61,"author_name":22,"view_count":62,"vote_count":24,"lang_type":25,"type":26,"type_label":27},1943,"297e4ff3-3e26-11f1-9bc6-00163e2b0d79","nltk-natural-language-processing-toolkit-python-297e4ff3","NLTK — Natural Language Processing Toolkit for Python","NLTK (Natural Language Toolkit) is the foundational Python library for computational linguistics, providing tokenizers, parsers, classifiers, and corpora used in NLP education and research since 2001.",101,{"id":64,"uuid":65,"slug":66,"title":67,"description":68,"author_name":47,"view_count":69,"vote_count":24,"lang_type":25,"type":26,"type_label":27},2308,"29fd01ff-431d-11f1-9bc6-00163e2b0d79","languagetool-self-hosted-grammar-style-checker-25-languages-29fd01ff","LanguageTool — Self-Hosted Grammar and Style Checker for 25+ 
Languages","An open-source grammar, style, and spell checker that supports over 25 languages and can be self-hosted as an HTTP API server for private proofreading.",165,{"id":71,"uuid":72,"slug":73,"title":74,"description":75,"author_name":22,"view_count":76,"vote_count":24,"lang_type":25,"type":26,"type_label":27},1865,"13b1fee7-3cf7-11f1-9bc6-00163e2b0d79","vale-syntax-aware-prose-linter-technical-writing-13b1fee7","Vale — Syntax-Aware Prose Linter for Technical Writing","Vale is a command-line tool that enforces writing style guides on your prose, supporting custom rules for documentation teams to ensure consistent terminology, tone, and formatting across Markdown, AsciiDoc, and more.",69,{"id":34,"uuid":78,"slug":79,"title":80,"description":81,"author_name":82,"view_count":83,"vote_count":24,"lang_type":25,"type":26,"type_label":27},"eb0f9dd6-2172-4c9f-aca9-97846b0f4d86","whisper-openai-speech-text-eb0f9dd6","Whisper — OpenAI Speech-to-Text","OpenAI's open-source speech recognition model. Transcribe audio\u002Fvideo to text with word-level timestamps in 99 languages. 
Essential for subtitle generation.","OpenAI",214,{"id":85,"uuid":86,"slug":87,"title":88,"description":89,"author_name":22,"view_count":90,"vote_count":24,"lang_type":25,"type":26,"type_label":27},2632,"e0ea662e-47b4-11f1-9bc6-00163e2b0d79","krillinai-ai-video-translation-dubbing-100-languages-e0ea662e","KrillinAI — AI Video Translation and Dubbing in 100 Languages","An open-source tool that uses LLMs to translate and dub video content into over 100 languages with one-click deployment, optimized for YouTube, TikTok, and other platforms.",85,"tokrepo install pack\u002Ftranslator-multilingual-stack",{"pageType":93,"pageKey":8,"locale":94,"title":95,"metaDescription":96,"h1":97,"tldr":98,"bodyMarkdown":99,"faq":100,"schema":116,"internalLinks":122,"citations":135,"wordCount":148,"generatedAt":149},"pack","zh","译者的多语种栈 — 10 个工具搭一条真本地化流水线","Weblate \u002F Tolgee \u002F LibreTranslate \u002F PDFMathTranslate \u002F Fairseq \u002F NLTK \u002F LanguageTool \u002F Vale \u002F Whisper \u002F KrillinAI — 10 件资产给本地化工程师、译者、i18n PM 跑一条真的「抽取 → 术语表 → 翻译 → QA → 回注」流水线。全套可自托管，格式感知，术语严格。","译者的多语种栈 — 真 i18n 流水线的 10 个候选","10 个工具按本地化流水线真实顺序排：TMS 抽取\u002F回注字符串、术语表 owner、两个翻译引擎（LLM + NMT 可互兜底）、两道 QA（术语 + 语法）、外加 PDF 和视频两种硬格式的专门工具。全套自托管。","## 这个 pack 包含什么\n\n这是给真正在干活的**本地化工程师、译者、i18n PM** 的栈 — 就是那个要把 po\u002Fxliff\u002Fjson 文件交付出去、不能让 build 挂、不能把占位符 `{username}` 弄丢、不能因为 LLM 忘了这是个 SaaS 应用就把 \"trial\" 翻成「法庭审判」的人。\n\n它**不是**一个魔法翻译器。本地化的活分五步 — 抽取、建术语表、翻译、QA、回注 — 每一步都有自己的工具和自己的翻车点。这个 pack 在每一步给一个默认选项，再在两个容易翻车的步骤（翻译引擎本身、TMS 啃不动的格式）各给一个兜底。\n\n下面全部**可自托管**。这件事很重要：公司里真正的 translation memory 通常也是法律敏感内容（合同、未发布的 release notes、客服工单）。不假思索就丢给第三方 MT 厂商，是合规电话会议的开端。\n\n## 推荐安装顺序（抽取 → 术语表 → 翻译 → QA → 回注）\n\n1. **Weblate** — TMS。从这里起步，因为其他所有工具都接到它上面。Weblate 盯你的 git 仓库，从 gettext\u002Fxliff\u002Fjson\u002Fproperties 抽字符串，交给译者（或 MT 引擎）翻译，再以 commit 形式推回去。Docker 自托管，一下午搭完。\n2. **Tolgee** — 开发者友好版替代。如果你的译者不懂技术、需要在运行中的应用里 alt-click 就能编辑字符串的「上下文编辑器」，选 Tolgee 而不是 Weblate。多数团队二选一：git 原生工程团队选 Weblate，产品驱动团队选 Tolgee。\n3. 
**LibreTranslate** — NMT 引擎。自托管 Argos 模型，无 API key，无限流。这是 LLM 太慢、太贵或者拒绝翻译时的兜底。接进 Weblate 当自动建议后端。\n4. **Fairseq** — 当你要在自家语料上真训练或微调 NMT 模型时。多数团队不会走到这里。会走到这一步的（强监管行业、低资源语种、post-edit 量极大的工作流）也躲不掉。知道它存在已经是一半。\n5. **Claude \u002F GPT-4 级 LLM**（通过 IDE 或 API）— 上下文感知译者。给那些必须读起来像人写的字符串用：营销文案、面向用户的报错、新手引导。**永远**把术语表和上下文一起放进 prompt，永远。\n6. **NLTK** — Python NLP 工具箱。中间环节那些不起眼的活全靠它：分词、断句、给术语表挖候选词、计算翻译输出的 BLEU\u002FchrF。它不是翻译器，是胶带。\n7. **LanguageTool** — 25+ 语言的语法 + 风格 QA。跑在**翻译后**的文本上，不是源文本。它抓的是那一类静默 bug：翻译语法上是错的，但非母语审稿人根本看不出来（德语词格、法语一致性、西语 ser\u002Festar）。\n8. **Vale** — 带自定义规则包的散文 linter。这是你的**术语**执行者：风格指南说「写 sign in 不写 login」就禁掉 login、禁止翻译 \"Pull Request\"、营销语种里禁某种语气。和 LanguageTool 配对：Vale 抓政策违规，LanguageTool 抓语法。\n9. **PDFMathTranslate** — 保留排版、公式、图表地翻译 PDF。其他 PDF 翻译器全做错的那件事。技术文档、学术论文、必须回到 PDF 的监管申报都需要它。\n10. **Whisper + KrillinAI** — 当源是**口语**时。Whisper 抓带时间戳的转写；KrillinAI 包办整条「视频翻到 100 种语言」的流水线，需要的话还能配音。源是视频时才用这俩 — 它们是 TMS 啃不动的格式逃生口。\n\n## 它们怎么协同（翻译流水线）\n\n```\n  源内容 (po \u002F xliff \u002F json \u002F md \u002F pdf \u002F video)\n        │\n        ▼\n   ┌──── Weblate (或 Tolgee) ────┐\n   │   抽字符串 + 分段              │\n   │   ─────────────────────────  │\n   │   PDF → PDFMathTranslate    │\n   │   视频 → Whisper + Krillin  │\n   └──────────────┬───────────────┘\n                  ▼\n            术语表 (TMX\u002FCSV)\n          由术语 owner 维护\n                  │\n                  ▼\n     ┌──── 翻译 ────┐\n     │  ╱         ╲ │\n     │ LLM (上下   LibreTranslate │\n     │  文感知)    (批量 + 兜底)   │\n     │   ╲       ╱  │\n     │   Fairseq (要微调时) │\n     └──────┬───────┘\n            ▼\n      ┌──── QA 闸 ────┐\n      │ Vale (术语)    │\n      │   AND          │\n      │ LanguageTool (语法) │\n      │   AND          │\n      │ NLTK (BLEU\u002FchrF 评分) │\n      └──────┬───────────┘\n             ▼\n     Weblate commit 回注 → git → build\n```\n\n关键的环节是 **QA 闸**：Vale + LanguageTool 双双通过、术语报告显示零违规之前，任何字符串都不许进回注那一步。没这个闸，规模一上来 LLM 的上下文丢失就会把你吃掉。\n\n## 你会遇到的取舍\n\n- **LLM vs Google Translate vs DeepL vs 
LibreTranslate** — LLM 赢在上下文（它知道 `{user_name}` 是占位符不是词）。DeepL 赢在欧洲语言的流畅度。Google 赢在语种覆盖广。LibreTranslate 赢在成本 + 隐私因为跑在你 VPC 里。生产环境按字符串路由：营销文案 → LLM、UI 字符串 → DeepL 或 NMT、内部文档 → LibreTranslate。\n- **术语表的松紧** — 太严翻译读起来像机器人。太松一个产品里「sign in」「log in」「登入」「登录」「登陆」会同时存在。中间路线：**品牌词**和**法律词**硬执行、风格选择软建议、审稿人可以带评论覆盖。\n- **Weblate vs Tolgee vs Lokalise\u002FCrowdin** — 托管 SaaS（Lokalise、Crowdin、Phrase）上手快但锁定你、按字符串收费。Weblate 是「译者活在 git 里」时的开源默认。Tolgee 是「译者需要上下文编辑」时的开源默认。除非你真需要那些集成而且不在乎账单，跳过 SaaS。\n- **MT 预翻 + 后编辑 vs 纯人工** — 90% 的字符串，MT + 后编辑比纯人工快 3-5 倍、质量相同。失败的那 10%（法律、品牌语气、笑话、文化梗）在源文件里**提前**用 tag 标出来、单独走纯人工。把整个 App 当成 10% 处理是本地化成本爆炸的方式。\n\n## 常见踩坑\n\n- **上下文丢失** — 翻译 `Save` 时不知道这是按钮、功能名、还是「已保存」的过去时。修复：把截图 URL、上下文句子、UI 组件类型一起塞进 translation memory。Tolgee 原生支持；Weblate 要装截图插件。\n- **格式破坏** — 弄丢 `{count}` 占位符、把 `\u003Ca href=\"...\">` 的 HTML 写坏、删掉行尾换行。commit 前永远拿翻译后字符串的**形状**和源做对比验证。Weblate 有占位符检查；打开它。\n- **术语漂移** — 半年里三个译者各自给 \"workspace\" 选了不同的词。每周跑 Vale + 术语审计；术语违规要当 CI 失败处理，不是软警告。\n- **复数形式** — 英语 2 种复数、俄语 3 种、阿拉伯语 6 种、中文 1 种。从 day 1 就用 ICU MessageFormat，不要字符串拼接复数。\n- **RTL 语言** — 阿拉伯语和希伯来语不只是把文字翻转，还翻转布局、括号、标点规则。RTL 要在 QA 里测，不是在生产里测。\n- **没脱敏就把 TM 喂给第三方 LLM** — 你的 translation memory 里有未发布的 release notes 和所有客服工单。在内容**离开 VPC 之前**脱敏 PII 和未公开内容。LibreTranslate 存在就是为了这个原因。",[101,104,107,110,113],{"q":102,"a":103},"Weblate 和 Tolgee 真的要都装吗？","不用 — 二选一。如果你的译者用 git 顺手、整条流水线想保持工程师习惯（PR、commit 历史、CI 闸），默认 Weblate。如果你的译者不懂技术、想在运行中的应用里 alt-click 字符串直接改，默认 Tolgee。两个都试的团队最后会把不匹配自己译者干活方式的那个砍掉。pack 把两个都列出来是因为选哪个取决于团队，不取决于技术。",{"q":105,"a":106},"Claude 这种 LLM 啥都能翻，为啥还要 LibreTranslate？","三个原因。一是成本：LibreTranslate 跑在自己硬件上无 token 计费，5 万字符串的产品做批量预翻译，成本差距很大。二是延迟：LibreTranslate 毫秒级返回，LLM 秒级。三是隐私：translation memory 里通常有未发布的产品细节、合同、客户数据 — 留在自己 VPC 很重要。能跑的模式是：上下文重的字符串（营销、报错）给 LLM、一致性和成本重的字符串（批量 UI、内部文档）给 NMT。",{"q":108,"a":109},"Vale 和 LanguageTool 有啥区别 — 不都是 linter？","它们解决不同的层。LanguageTool 是语法检查器：它懂德语词格、法语一致性、西语 ser\u002Festar — 这些是译者可能错是因为**目标语言**本身难。Vale 是风格和术语 linter：执行你的风格指南（「绝不写 login，永远写 sign in」「绝不翻译 
Pull Request」）。两个都要。LanguageTool 抓语法漂移，Vale 抓政策漂移。只跑一个，会留一类 bug 不设防。",{"q":111,"a":112},"这周能跑起来的最小版本是啥？","三件套：Weblate（Docker，一下午就能对着 git 仓库搭起来）、LibreTranslate（Docker 一个容器，接成 Weblate 的 MT 建议引擎）、Vale（CLI，一个配置文件写禁用词列表）。这三件就有了「抽取 → MT 预翻 → 术语闸 → commit」。下周加 LanguageTool，抓 LibreTranslate 译文里 Vale 抓不到的语法 bug。再下一步给营销文案加 LLM 通道。pack 其他工具，等你撞到三件套基线啃不动的格式时再加。",{"q":114,"a":115},"源代码、截图、术语表、TMS 几头分裂，怎么让译者出活儿？","最大的杠杆是把**真实 UI 的截图**放进 translation memory、按字符串绑定。Tolgee 一键搞定；Weblate 要装截图插件 + 写个小 CI 任务，给每个组件上传一张 Storybook 截图。译者能看到自己在翻什么之后，UI 字符串的吞吐量大概涨 30-50%，「德语翻译撑爆按钮」的 bug 报告也会消失。第二个杠杆是**自动加载相似字符串的最近 5 条翻译**作为上下文 — 多数 TMS 都有，打开它。",{"@context":117,"@type":118,"name":13,"description":119,"numberOfItems":120,"inLanguage":121},"https:\u002F\u002Fschema.org","ItemList","10 个可自托管的资产，搭一条真本地化流水线：TMS、NMT、LLM 翻译、术语 QA、语法 QA，外加 PDF 和视频两种硬格式的专门工具。",10,"zh-CN",[123,127,131],{"url":124,"anchor":125,"reason":126},"\u002Fzh\u002Fai-tools-for\u002Ftranslation","TokRepo 翻译工具集","更大的翻译与语言资产目录",{"url":128,"anchor":129,"reason":130},"\u002Fzh\u002Fai-tools-for\u002Fautomation","AI Agent 自动化工具集","Weblate 与 QA 闸都接进更大的 CI 自动化栈",{"url":132,"anchor":133,"reason":134},"\u002Fzh\u002Ftopics","浏览其他主题 Pack","更多角色化的 pack：工程师、ML、独立开发者",[136,140,144],{"claim":137,"source_name":138,"source_url":139},"Weblate 是基于 Web 的持续本地化平台","Weblate 官方文档","https:\u002F\u002Fdocs.weblate.org\u002F",{"claim":141,"source_name":142,"source_url":143},"LibreTranslate 是基于 Argos Translate 的自托管翻译 API","LibreTranslate GitHub","https:\u002F\u002Fgithub.com\u002FLibreTranslate\u002FLibreTranslate",{"claim":145,"source_name":146,"source_url":147},"Vale 是带自定义规则包、能感知标记语法（syntax-aware）的散文 linter","Vale 官方文档","https:\u002F\u002Fvale.sh\u002F",2050,"2026-05-22T14:00:00Z"]