Files

334 lines
16 KiB
JSON
Raw Permalink Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
{
"benchmark.actions.delete": "删除基准",
"benchmark.actions.delete.confirm": "确定要删除此基准吗?相关数据集和评测记录也会被删除。",
"benchmark.actions.edit": "编辑基准",
"benchmark.actions.export": "导出",
"benchmark.card.bestScore": "最佳",
"benchmark.card.caseCount": "{{count}} 个用例",
"benchmark.card.datasetCount": "{{count}} 个数据集",
"benchmark.card.empty": "暂无评测记录",
"benchmark.card.emptyHint": "前往基准详情页创建新的评测",
"benchmark.card.importDataset": "导入数据集",
"benchmark.card.noDataset": "暂无数据集",
"benchmark.card.noDatasetHint": "导入数据集以开始评测",
"benchmark.card.noRecentRuns": "暂无最近的评测记录",
"benchmark.card.recentRuns": "最近评测",
"benchmark.card.runCount": "{{count}} 次评测",
"benchmark.card.startFirst": "开始首次评测",
"benchmark.card.viewAll": "查看全部 {{count}} 条",
"benchmark.create.confirm": "创建",
"benchmark.create.description.label": "描述",
"benchmark.create.description.placeholder": "基准描述(选填)",
"benchmark.create.error": "创建基准失败",
"benchmark.create.identifier.label": "标识符",
"benchmark.create.identifier.placeholder": "benchmark-identifier",
"benchmark.create.identifierRequired": "请输入标识符",
"benchmark.create.name.label": "名称",
"benchmark.create.name.placeholder": "输入基准名称",
"benchmark.create.nameRequired": "请输入基准名称",
"benchmark.create.success": "基准创建成功",
"benchmark.create.tags.label": "标签",
"benchmark.create.tags.placeholder": "添加标签,用逗号或空格分隔",
"benchmark.create.title": "创建基准",
"benchmark.detail.backToOverview": "返回总览",
"benchmark.detail.datasetCount": "此基准包含 {{count}} 个数据集",
"benchmark.detail.runCount": "此基准有 {{count}} 次评测",
"benchmark.detail.stats.addFirstDataset": "点击添加首个数据集",
"benchmark.detail.stats.avgCost": "平均成本",
"benchmark.detail.stats.avgDuration": "平均耗时",
"benchmark.detail.stats.basedOnLastNRuns": "基于最近 {{count}} 次评测",
"benchmark.detail.stats.bestPerformance": "目前最佳表现由 {{agent}} 达成,通过率 {{passRate}}%",
"benchmark.detail.stats.bestScore": "最佳分数",
"benchmark.detail.stats.cases": "用例",
"benchmark.detail.stats.dataScale": "数据规模",
"benchmark.detail.stats.datasets": "数据集",
"benchmark.detail.stats.needSetup": "需配置",
"benchmark.detail.stats.noEvalRecord": "尚无评测记录",
"benchmark.detail.stats.perRun": "/ 次",
"benchmark.detail.stats.runs": "评测",
"benchmark.detail.stats.tags": "标签",
"benchmark.detail.stats.topAgents": "Top Agents",
"benchmark.detail.stats.totalCases": "总用例数",
"benchmark.detail.stats.waiting": "Waiting...",
"benchmark.detail.tabs.data": "数据",
"benchmark.detail.tabs.datasets": "数据集",
"benchmark.detail.tabs.runs": "运行",
"benchmark.edit.confirm": "保存",
"benchmark.edit.error": "更新基准失败",
"benchmark.edit.success": "基准更新成功",
"benchmark.edit.title": "编辑基准",
"benchmark.empty": "暂无基准,请先创建一个。",
"caseDetail.actual": "实际输出",
"caseDetail.chatArea.title": "对话记录",
"caseDetail.completionReason": "状态",
"caseDetail.cost": "费用",
"caseDetail.difficulty": "难度",
"caseDetail.duration": "耗时",
"caseDetail.expected": "期望输出",
"caseDetail.failureReason": "失败原因",
"caseDetail.input": "输入",
"caseDetail.judgeComment": "裁判评语",
"caseDetail.resources": "资源",
"caseDetail.score": "评分",
"caseDetail.section.runtime": "执行信息",
"caseDetail.section.scoring": "评分详情",
"caseDetail.section.testCase": "测试用例",
"caseDetail.steps": "执行步数",
"caseDetail.threads.attempt": "运行轨迹 #{{number}}",
"caseDetail.tokens": "Token 用量",
"common.cancel": "取消",
"common.create": "创建",
"common.delete": "删除",
"common.edit": "编辑",
"common.later": "稍后",
"common.next": "下一步",
"common.update": "更新",
"dataset.actions.addDataset": "添加数据集",
"dataset.actions.import": "导入数据",
"dataset.actions.importDataset": "导入数据集",
"dataset.create.description.label": "描述",
"dataset.create.description.placeholder": "数据集描述(选填)",
"dataset.create.error": "创建数据集失败",
"dataset.create.identifier.label": "标识符",
"dataset.create.identifier.placeholder": "dataset-identifier",
"dataset.create.identifierRequired": "请输入标识符",
"dataset.create.importNow": "是否立即导入数据?",
"dataset.create.name.label": "数据集名称",
"dataset.create.name.placeholder": "输入数据集名称",
"dataset.create.nameRequired": "请输入数据集名称",
"dataset.create.preset.label": "数据集预设",
"dataset.create.success": "数据集创建成功",
"dataset.create.successTitle": "数据集已创建",
"dataset.create.title": "创建数据集",
"dataset.delete.confirm": "确定要删除此数据集吗?其中的所有数据用例也会被删除。",
"dataset.delete.error": "删除数据集失败",
"dataset.delete.success": "数据集删除成功",
"dataset.detail.addRun": "新增运行",
"dataset.detail.backToBenchmark": "返回基准测试",
"dataset.detail.caseCount": "{{count}} 个测试用例",
"dataset.detail.relatedRuns": "相关运行({{count}}",
"dataset.detail.testCases": "测试用例",
"dataset.detail.viewDetail": "查看详情",
"dataset.edit.error": "更新数据集失败",
"dataset.edit.success": "数据集更新成功",
"dataset.edit.title": "编辑数据集",
"dataset.empty": "暂无数据集",
"dataset.empty.description": "导入数据集以开始构建此基准",
"dataset.empty.title": "暂无数据集",
"dataset.evalMode.hint": "数据集默认评估模式,可被用例级别覆盖",
"dataset.import.category": "分类",
"dataset.import.categoryDesc": "用于分组的分类标签",
"dataset.import.choices": "选项",
"dataset.import.choicesDesc": "多选选项",
"dataset.import.confirm": "导入",
"dataset.import.error": "导入数据集失败",
"dataset.import.expected": "期望答案",
"dataset.import.expectedDelimiter": "答案分隔符",
"dataset.import.expectedDelimiter.desc": "答案分隔符",
"dataset.import.expectedDelimiter.placeholder": "如 | 或 ,",
"dataset.import.expectedDesc": "用于对比的正确答案",
"dataset.import.fieldMapping": "字段映射",
"dataset.import.fieldMapping.desc": "必须指定「输入」列",
"dataset.import.hideSkipped": "隐藏跳过的列",
"dataset.import.ignore": "跳过",
"dataset.import.ignoreDesc": "不导入此列",
"dataset.import.input": "输入",
"dataset.import.inputDesc": "发送给模型的问题或提示",
"dataset.import.metadata": "元数据",
"dataset.import.metadataDesc": "额外信息,原样存储",
"dataset.import.next": "下一步",
"dataset.import.parseError": "文件解析失败",
"dataset.import.parsing": "正在解析文件...",
"dataset.import.prev": "上一步",
"dataset.import.preview": "数据预览",
"dataset.import.preview.desc": "确认映射正确后导入。",
"dataset.import.preview.rows": "共 {{count}} 行",
"dataset.import.sortOrder": "题目编号",
"dataset.import.sortOrderDesc": "题目/用例的编号,便于沟通引用",
"dataset.import.step.mapping": "映射字段",
"dataset.import.step.preview": "预览",
"dataset.import.step.upload": "上传文件",
"dataset.import.success": "成功导入 {{count}} 个数据用例",
"dataset.import.title": "导入数据集",
"dataset.import.upload.hint": "支持 CSV、XLSX、JSON、JSONL",
"dataset.import.upload.text": "点击或拖拽文件到此处",
"dataset.import.uploading": "上传中...",
"dataset.switchDataset": "切换数据集",
"difficulty.easy": "简单",
"difficulty.hard": "困难",
"difficulty.medium": "中等",
"evalMode.answer-relevance": "LLM 相关性",
"evalMode.answer-relevance.desc": "使用 LLM 评估答案相关性(是或否)",
"evalMode.contains": "包含匹配",
"evalMode.contains.desc": "输出中必须包含期望的文本",
"evalMode.equals": "精确匹配",
"evalMode.equals.desc": "输出必须与期望内容完全一致",
"evalMode.external": "外部评估",
"evalMode.external.desc": "代理运行完成;评分由外部系统处理",
"evalMode.label": "评估模式",
"evalMode.llm-rubric": "LLM 评判",
"evalMode.llm-rubric.desc": "使用 LLM 评估输出质量",
"evalMode.placeholder": "选择评估模式",
"evalMode.prompt.label": "评判提示词",
"evalMode.prompt.placeholder": "输入 LLM 评判的评估标准或提示词",
"evalMode.rubric": "混合指标评分",
"evalMode.rubric.desc": "使用基准的加权指标进行混合评分",
"overview.createBenchmark": "创建基准",
"overview.importDataset": "导入数据集",
"overview.subtitle": "对你的 AI 助手进行跨数据集的基准测试与评估",
"overview.title": "评测实验室",
"run.actions.abort": "终止",
"run.actions.abort.confirm": "确定要终止此评测吗?",
"run.actions.batchResume": "批量恢复",
"run.actions.batchResume.modal.confirm": "恢复选中项",
"run.actions.batchResume.modal.selectAll": "全选",
"run.actions.batchResume.modal.selected": "已选中 {{count}} 项",
"run.actions.batchResume.modal.title": "批量恢复案例",
"run.actions.create": "新建评测",
"run.actions.delete": "删除",
"run.actions.delete.confirm": "确定要删除此评测吗?",
"run.actions.edit": "编辑",
"run.actions.resumeCase": "恢复",
"run.actions.retryCase": "重试",
"run.actions.retryErrors": "重试错误用例",
"run.actions.retryErrors.confirm": "将重新运行所有错误和超时的用例。已通过和未通过的用例不受影响。",
"run.actions.run": "执行",
"run.actions.start": "启动",
"run.actions.start.confirm": "确定要启动此评测吗?",
"run.chart.duration": "耗时 (s)",
"run.chart.error": "出错",
"run.chart.fail": "失败",
"run.chart.latencyDistribution": "耗时分布",
"run.chart.latencyTokenDistribution": "耗时 / Token 分布",
"run.chart.pass": "通过",
"run.chart.passFailError": "通过 / 失败 / 出错",
"run.chart.tokens": "Tokens",
"run.config.agentId": "执行 Agent",
"run.config.concurrency": "并发数",
"run.config.judgeModel": "裁判模型",
"run.config.k": "执行次数 (K)",
"run.config.k.hint": "每个测试用例执行 {{k}} 次,用于 pass@{{k}}/pass^{{k}} 指标",
"run.config.maxSteps": "最大步数",
"run.config.maxSteps.hint": "Agent 每执行一次 LLM 调用或工具调用都算 1 步",
"run.config.model": "模型",
"run.config.temperature": "温度",
"run.config.timeout": "超时时间",
"run.config.timeout.unit": "分钟",
"run.create.advanced": "高级设置",
"run.create.agent": "执行 Agent",
"run.create.agent.placeholder": "选择助手",
"run.create.agent.required": "请选择一个助手",
"run.create.caseCount": "{{count}} 个用例",
"run.create.confirm": "创建并执行",
"run.create.createOnly": "创建",
"run.create.dataset": "数据集",
"run.create.dataset.placeholder": "选择数据集",
"run.create.dataset.required": "请选择数据集",
"run.create.name": "评测名称",
"run.create.name.placeholder": "输入评测名称",
"run.create.name.required": "请输入评测名称",
"run.create.name.useTimestamp": "使用当前时间作为名称",
"run.create.openAgent": "在新窗口中打开助手",
"run.create.title": "新建评测",
"run.create.titleWithDataset": "基于 {{dataset}} 数据集新建评测",
"run.detail.agent": "执行 Agent",
"run.detail.agent.none": "未指定",
"run.detail.agent.unnamed": "未命名助手",
"run.detail.backToBenchmark": "返回基准测试",
"run.detail.caseResults": "评测明细",
"run.detail.config": "评测配置",
"run.detail.configSnapshot": "配置快照",
"run.detail.copyRunId": "复制运行 ID",
"run.detail.copyRunIdFailed": "复制运行 ID 失败",
"run.detail.copyRunIdSuccess": "运行 ID 已复制",
"run.detail.dataset": "数据集",
"run.detail.model": "模型",
"run.detail.overview": "概览",
"run.detail.progress": "进度",
"run.detail.progressCases": "个用例",
"run.detail.report": "评测概要",
"run.edit.error": "更新评测失败",
"run.edit.success": "评测更新成功",
"run.edit.title": "编辑评测",
"run.empty.description": "在此数据集上开始你的首次评测",
"run.empty.descriptionBenchmark": "在此基准上开始你的首次评测",
"run.empty.title": "尚无运行",
"run.external.hint": "运行已完成。等待外部系统提交评估结果...",
"run.filter.active": "进行中",
"run.filter.empty": "当前筛选条件下无匹配的运行。",
"run.idle.hint": "点击开始以启动评测",
"run.metrics.avgScore": "平均分",
"run.metrics.cost": "费用",
"run.metrics.duration": "耗时",
"run.metrics.errorCases": "出错",
"run.metrics.evaluated": "{{count}} 个已评测",
"run.metrics.passRate": "通过率",
"run.metrics.perCase": "/用例",
"run.metrics.tokens": "Tokens",
"run.metrics.totalDuration": "累计",
"run.pending.hint": "评测已进入运行队列,等待启动中...",
"run.running.hint": "评测进行中,结果即将呈现...",
"run.status.aborted": "已终止",
"run.status.completed": "已完成",
"run.status.completed.tooltip": "运行和外部评分已完成。",
"run.status.error": "运行出错",
"run.status.external": "等待评估",
"run.status.external.tooltip": "代理已完成运行。等待外部系统提交评估结果。",
"run.status.failed": "失败",
"run.status.idle": "待开始",
"run.status.pending": "等待中",
"run.status.running": "进行中",
"run.status.timeout": "超时",
"sidebar.benchmarks": "基准",
"sidebar.dashboard": "总览",
"sidebar.datasets": "数据集",
"sidebar.runs": "评测",
"table.columns.avgCost": "平均成本",
"table.columns.category": "分类",
"table.columns.cost": "成本",
"table.columns.difficulty": "难度",
"table.columns.duration": "耗时",
"table.columns.evalMode": "评估方式",
"table.columns.expected": "期望答案",
"table.columns.input": "输入",
"table.columns.score": "评分",
"table.columns.status": "状态",
"table.columns.steps": "步数",
"table.columns.tags": "标签",
"table.columns.tokens": "Tokens",
"table.columns.totalCost": "总成本",
"table.filter.all": "全部",
"table.filter.error": "运行出错",
"table.filter.failed": "失败",
"table.filter.passed": "通过",
"table.filter.running": "运行中",
"table.search.placeholder": "搜索用例...",
"table.total": "共 {{count}} 条",
"testCase.actions.add": "添加数据用例",
"testCase.actions.import": "导入数据用例",
"testCase.create.advanced": "更多选项",
"testCase.create.difficulty.label": "难度",
"testCase.create.error": "添加数据用例失败",
"testCase.create.expected.label": "期望输出",
"testCase.create.expected.placeholder": "输入期望的回答",
"testCase.create.expected.required": "请输入期望输出",
"testCase.create.input.label": "输入",
"testCase.create.input.placeholder": "输入数据用例的问题或输入内容",
"testCase.create.success": "数据用例添加成功",
"testCase.create.tags.label": "标签",
"testCase.create.tags.placeholder": "用逗号分隔的标签(选填)",
"testCase.create.title": "添加数据用例",
"testCase.delete.confirm": "确定要删除该数据用例吗?",
"testCase.delete.error": "删除数据用例失败",
"testCase.delete.success": "数据用例已删除",
"testCase.edit.error": "更新数据用例失败",
"testCase.edit.success": "数据用例更新成功",
"testCase.edit.title": "编辑数据用例",
"testCase.empty.description": "导入或手动添加数据用例到此数据集",
"testCase.empty.title": "暂无数据用例",
"testCase.preview.expected": "期望",
"testCase.preview.input": "输入",
"testCase.preview.title": "数据用例预览",
"testCase.search.placeholder": "搜索用例..."
}