{
"benchmark.actions.delete": "Delete Benchmark",
"benchmark.actions.delete.confirm": "Are you sure you want to delete this benchmark? Related datasets and evaluation records will also be deleted.",
"benchmark.actions.edit": "Edit Benchmark",
"benchmark.actions.export": "Export",
"benchmark.card.bestScore": "Best",
"benchmark.card.caseCount": "{{count}} cases",
"benchmark.card.datasetCount": "{{count}} datasets",
"benchmark.card.empty": "No evaluations yet",
"benchmark.card.emptyHint": "Create a new evaluation from the benchmark detail page",
"benchmark.card.importDataset": "Import Dataset",
"benchmark.card.noDataset": "No datasets yet",
"benchmark.card.noDatasetHint": "Import a dataset to start evaluating",
"benchmark.card.noRecentRuns": "No recent evaluations to display",
"benchmark.card.recentRuns": "Recent Evaluations",
"benchmark.card.runCount": "{{count}} evals",
"benchmark.card.startFirst": "Start First Evaluation",
"benchmark.card.viewAll": "View all {{count}}",
"benchmark.create.confirm": "Create",
"benchmark.create.description.label": "Description",
"benchmark.create.description.placeholder": "Benchmark description (optional)",
"benchmark.create.error": "Failed to create benchmark",
"benchmark.create.identifier.label": "Identifier",
"benchmark.create.identifier.placeholder": "benchmark-identifier",
"benchmark.create.identifierRequired": "Please enter an identifier",
"benchmark.create.name.label": "Name",
"benchmark.create.name.placeholder": "Enter benchmark name",
"benchmark.create.nameRequired": "Please enter a benchmark name",
"benchmark.create.success": "Benchmark created successfully",
"benchmark.create.tags.label": "Tags",
"benchmark.create.tags.placeholder": "Add tags, separated by commas or spaces",
"benchmark.create.title": "Create Benchmark",
"benchmark.detail.backToOverview": "Back to Overview",
"benchmark.detail.datasetCount": "{{count}} dataset(s) in this benchmark",
"benchmark.detail.runCount": "{{count}} evaluation run(s) on this benchmark",
"benchmark.detail.stats.addFirstDataset": "Click to add first dataset",
"benchmark.detail.stats.avgCost": "Avg Cost",
"benchmark.detail.stats.avgDuration": "Avg Duration",
"benchmark.detail.stats.basedOnLastNRuns": "Based on last {{count}} runs",
"benchmark.detail.stats.bestPerformance": "Best performance by {{agent}} with {{passRate}}% pass rate",
"benchmark.detail.stats.bestScore": "Best Score",
"benchmark.detail.stats.cases": "Cases",
"benchmark.detail.stats.dataScale": "Data Scale",
"benchmark.detail.stats.datasets": "Datasets",
"benchmark.detail.stats.needSetup": "Setup Required",
"benchmark.detail.stats.noEvalRecord": "No evaluation records yet",
"benchmark.detail.stats.perRun": "/ Run",
"benchmark.detail.stats.runs": "Runs",
"benchmark.detail.stats.tags": "Tags",
"benchmark.detail.stats.topAgents": "Top Agents",
"benchmark.detail.stats.totalCases": "Total Cases",
"benchmark.detail.stats.waiting": "Waiting...",
"benchmark.detail.tabs.data": "Data",
"benchmark.detail.tabs.datasets": "Datasets",
"benchmark.detail.tabs.runs": "Runs",
"benchmark.edit.confirm": "Save",
"benchmark.edit.error": "Failed to update benchmark",
"benchmark.edit.success": "Benchmark updated successfully",
"benchmark.edit.title": "Edit Benchmark",
"benchmark.empty": "No benchmarks yet. Create one to get started.",
"caseDetail.actual": "Actual Output",
"caseDetail.chatArea.title": "Conversation",
"caseDetail.completionReason": "Status",
"caseDetail.cost": "Cost",
"caseDetail.difficulty": "Difficulty",
"caseDetail.duration": "Duration",
"caseDetail.expected": "Expected Output",
"caseDetail.failureReason": "Failure Reason",
"caseDetail.input": "Input",
"caseDetail.judgeComment": "Judge Comment",
"caseDetail.resources": "Resources",
"caseDetail.score": "Score",
"caseDetail.section.runtime": "Runtime",
"caseDetail.section.scoring": "Scoring Details",
"caseDetail.section.testCase": "Test Case",
"caseDetail.steps": "Steps",
"caseDetail.threads.attempt": "Trajectory #{{number}}",
"caseDetail.tokens": "Token Usage",
"common.cancel": "Cancel",
"common.create": "Create",
"common.delete": "Delete",
"common.edit": "Edit",
"common.later": "Later",
"common.next": "Next",
"common.update": "Update",
"dataset.actions.addDataset": "Add Dataset",
"dataset.actions.import": "Import Data",
"dataset.actions.importDataset": "Import Dataset",
"dataset.create.description.label": "Description",
"dataset.create.description.placeholder": "Dataset description (optional)",
"dataset.create.error": "Failed to create dataset",
"dataset.create.identifier.label": "Identifier",
"dataset.create.identifier.placeholder": "dataset-identifier",
"dataset.create.identifierRequired": "Please enter an identifier",
"dataset.create.importNow": "Would you like to import data now?",
"dataset.create.name.label": "Dataset Name",
"dataset.create.name.placeholder": "Enter dataset name",
"dataset.create.nameRequired": "Please enter a dataset name",
"dataset.create.preset.label": "Dataset Preset",
"dataset.create.success": "Dataset created successfully",
"dataset.create.successTitle": "Dataset Created",
"dataset.create.title": "Create Dataset",
"dataset.delete.confirm": "Are you sure you want to delete this dataset? All test cases in it will also be deleted.",
"dataset.delete.error": "Failed to delete dataset",
"dataset.delete.success": "Dataset deleted successfully",
"dataset.detail.addRun": "New Run",
"dataset.detail.backToBenchmark": "Back to Benchmark",
"dataset.detail.caseCount": "{{count}} test case(s)",
"dataset.detail.relatedRuns": "Related Runs ({{count}})",
"dataset.detail.testCases": "Test Cases",
"dataset.detail.viewDetail": "View Details",
"dataset.edit.error": "Failed to update dataset",
"dataset.edit.success": "Dataset updated successfully",
"dataset.edit.title": "Edit Dataset",
"dataset.empty": "No datasets",
"dataset.empty.description": "Import a dataset to start building this benchmark",
"dataset.empty.title": "No datasets yet",
"dataset.evalMode.hint": "Default eval mode for the dataset; can be overridden at the test case level",
"dataset.import.category": "Category",
"dataset.import.categoryDesc": "Classification label for grouping",
"dataset.import.choices": "Choices",
"dataset.import.choicesDesc": "Multiple-choice options",
"dataset.import.confirm": "Import",
"dataset.import.error": "Failed to import dataset",
"dataset.import.expected": "Expected Answer",
"dataset.import.expectedDelimiter": "Answer Delimiter",
"dataset.import.expectedDelimiter.desc": "Answer delimiter",
"dataset.import.expectedDelimiter.placeholder": "e.g. | or ,",
"dataset.import.expectedDesc": "Correct answer to compare against",
"dataset.import.fieldMapping": "Field Mapping",
"dataset.import.fieldMapping.desc": "\"Input\" column is required",
"dataset.import.hideSkipped": "Hide skipped columns",
"dataset.import.ignore": "Skip",
"dataset.import.ignoreDesc": "Do not import this column",
"dataset.import.input": "Input",
"dataset.import.inputDesc": "Question or prompt sent to model",
"dataset.import.metadata": "Metadata",
"dataset.import.metadataDesc": "Extra info, stored as-is",
"dataset.import.next": "Next",
"dataset.import.parseError": "Failed to parse file",
"dataset.import.parsing": "Parsing file...",
"dataset.import.prev": "Previous",
"dataset.import.preview": "Data Preview",
"dataset.import.preview.desc": "Confirm the mapping is correct, then import.",
"dataset.import.preview.rows": "{{count}} rows total",
"dataset.import.sortOrder": "Item Number",
"dataset.import.sortOrderDesc": "Question/item ID for reference",
"dataset.import.step.mapping": "Map Fields",
"dataset.import.step.preview": "Preview",
"dataset.import.step.upload": "Upload File",
"dataset.import.success": "Successfully imported {{count}} test cases",
"dataset.import.title": "Import Dataset",
"dataset.import.upload.hint": "Supports CSV, XLSX, JSON, JSONL",
"dataset.import.upload.text": "Click or drag file here to upload",
"dataset.import.uploading": "Uploading...",
"dataset.switchDataset": "Switch Dataset",
"difficulty.easy": "Easy",
"difficulty.hard": "Hard",
"difficulty.medium": "Medium",
"evalMode.answer-relevance": "LLM Relevance",
"evalMode.answer-relevance.desc": "Use LLM to evaluate answer relevance (yes or no)",
"evalMode.contains": "Contains Match",
"evalMode.contains.desc": "Output must contain the expected text",
"evalMode.equals": "Exact Match",
"evalMode.equals.desc": "Output must be exactly the same as expected",
"evalMode.external": "External Eval",
"evalMode.external.desc": "Agent runs to completion; scoring is handled by an external system",
"evalMode.label": "Eval Mode",
"evalMode.llm-rubric": "LLM Judge",
"evalMode.llm-rubric.desc": "Use LLM to evaluate output quality based on custom criteria (0.0 to 1.0)",
"evalMode.placeholder": "Select eval mode",
"evalMode.prompt.label": "Judge Prompt",
"evalMode.prompt.placeholder": "Enter the evaluation criteria or prompt for LLM judge",
"evalMode.rubric": "Rubric Scoring",
"evalMode.rubric.desc": "Score output using benchmark rubrics with weighted criteria",
"overview.createBenchmark": "Create Benchmark",
"overview.importDataset": "Import Dataset",
"overview.subtitle": "Benchmark and evaluate your AI agents across datasets",
"overview.title": "Evaluation Lab",
"run.actions.abort": "Abort",
"run.actions.abort.confirm": "Are you sure you want to abort this evaluation?",
"run.actions.batchResume": "Batch Resume",
"run.actions.batchResume.modal.confirm": "Resume Selected",
"run.actions.batchResume.modal.selectAll": "Select All",
"run.actions.batchResume.modal.selected": "{{count}} selected",
"run.actions.batchResume.modal.title": "Batch Resume Cases",
"run.actions.create": "New Evaluation",
"run.actions.delete": "Delete",
"run.actions.delete.confirm": "Are you sure you want to delete this evaluation?",
"run.actions.edit": "Edit",
"run.actions.resumeCase": "Resume",
"run.actions.retryCase": "Retry",
"run.actions.retryErrors": "Retry Errors",
"run.actions.retryErrors.confirm": "This will re-run all error and timeout cases. Passed and failed cases will not be affected.",
"run.actions.run": "Run",
"run.actions.start": "Start",
"run.actions.start.confirm": "Are you sure you want to start this evaluation?",
"run.chart.duration": "Duration (s)",
"run.chart.error": "Error",
"run.chart.fail": "Fail",
"run.chart.latencyDistribution": "Latency Distribution",
"run.chart.latencyTokenDistribution": "Latency / Token Distribution",
"run.chart.pass": "Pass",
"run.chart.passFailError": "Pass / Fail / Error",
"run.chart.tokens": "Tokens",
"run.config.agentId": "Agent",
"run.config.concurrency": "Concurrency",
"run.config.judgeModel": "Judge Model",
"run.config.k": "Executions (K)",
"run.config.k.hint": "Run each test case {{k}} times for pass@{{k}}/pass^{{k}} metrics",
"run.config.maxSteps": "Max Steps",
"run.config.maxSteps.hint": "Each LLM call or tool call by the agent counts as 1 step",
"run.config.model": "Model",
"run.config.temperature": "Temperature",
"run.config.timeout": "Timeout",
"run.config.timeout.unit": "min",
"run.create.advanced": "Advanced Settings",
"run.create.agent": "Agent",
"run.create.agent.placeholder": "Select an agent",
"run.create.agent.required": "Please select an agent",
"run.create.caseCount": "{{count}} cases",
"run.create.confirm": "Create & Start",
"run.create.createOnly": "Create",
"run.create.dataset": "Dataset",
"run.create.dataset.placeholder": "Select a dataset",
"run.create.dataset.required": "Please select a dataset",
"run.create.name": "Run Name",
"run.create.name.placeholder": "Enter a name for this run",
"run.create.name.required": "Please enter a run name",
"run.create.name.useTimestamp": "Use current time as name",
"run.create.openAgent": "Open agent in new window",
"run.create.title": "New Evaluation",
"run.create.titleWithDataset": "New Evaluation on \"{{dataset}}\"",
"run.detail.agent": "Agent",
"run.detail.agent.none": "Not specified",
"run.detail.agent.unnamed": "Unnamed Agent",
"run.detail.backToBenchmark": "Back to Benchmark",
"run.detail.caseResults": "Eval Details",
"run.detail.config": "Evaluation Config",
"run.detail.configSnapshot": "Configuration Snapshot",
"run.detail.copyRunId": "Copy Run ID",
"run.detail.copyRunIdFailed": "Failed to copy Run ID",
"run.detail.copyRunIdSuccess": "Run ID copied",
"run.detail.dataset": "Dataset",
"run.detail.model": "Model",
"run.detail.overview": "Overview",
"run.detail.progress": "Progress",
"run.detail.progressCases": "cases",
"run.detail.report": "Evaluation Summary",
"run.edit.error": "Failed to update evaluation",
"run.edit.success": "Evaluation updated successfully",
"run.edit.title": "Edit Evaluation",
"run.empty.description": "Start your first evaluation run on this dataset",
"run.empty.descriptionBenchmark": "Start your first evaluation run on this benchmark",
"run.empty.title": "No runs yet",
"run.external.hint": "Run completed. Waiting for an external system to submit evaluation results...",
"run.filter.active": "Active",
"run.filter.empty": "No runs match the current filter.",
"run.idle.hint": "Click Start to begin evaluation",
"run.metrics.avgScore": "Avg Score",
"run.metrics.cost": "Cost",
"run.metrics.duration": "Duration",
"run.metrics.errorCases": "Error",
"run.metrics.evaluated": "{{count}} evaluated",
"run.metrics.passRate": "Pass Rate",
"run.metrics.perCase": "/ case",
"run.metrics.tokens": "Tokens",
"run.metrics.totalDuration": "Cumulative",
"run.pending.hint": "Evaluation is queued, waiting to start...",
"run.running.hint": "Evaluation is running, results will appear shortly...",
"run.status.aborted": "Aborted",
"run.status.completed": "Completed",
"run.status.completed.tooltip": "The run and external scoring are completed.",
"run.status.error": "Run Error",
"run.status.external": "Awaiting Eval",
"run.status.external.tooltip": "The agent has finished running. Waiting for an external system to submit evaluation results.",
"run.status.failed": "Failed",
"run.status.idle": "Idle",
"run.status.pending": "Pending",
"run.status.running": "Running",
"run.status.timeout": "Timeout",
"sidebar.benchmarks": "Benchmarks",
"sidebar.dashboard": "Dashboard",
"sidebar.datasets": "Datasets",
"sidebar.runs": "Runs",
"table.columns.avgCost": "Avg Cost",
"table.columns.category": "Category",
"table.columns.cost": "Cost",
"table.columns.difficulty": "Difficulty",
"table.columns.duration": "Duration",
"table.columns.evalMode": "Eval Mode",
"table.columns.expected": "Expected Answer",
"table.columns.input": "Input",
"table.columns.score": "Score",
"table.columns.status": "Status",
"table.columns.steps": "Steps",
"table.columns.tags": "Tags",
"table.columns.tokens": "Tokens",
"table.columns.totalCost": "Total Cost",
"table.filter.all": "All",
"table.filter.error": "Run Error",
"table.filter.failed": "Failed",
"table.filter.passed": "Passed",
"table.filter.running": "Running",
"table.search.placeholder": "Search cases...",
"table.total": "Total {{count}}",
"testCase.actions.add": "Add Test Case",
"testCase.actions.import": "Import Test Cases",
"testCase.create.advanced": "More Options",
"testCase.create.difficulty.label": "Difficulty",
"testCase.create.error": "Failed to add test case",
"testCase.create.expected.label": "Expected Output",
"testCase.create.expected.placeholder": "Enter the expected answer",
"testCase.create.expected.required": "Please enter the expected output",
"testCase.create.input.label": "Input",
"testCase.create.input.placeholder": "Enter the test case input or question",
"testCase.create.success": "Test case added successfully",
"testCase.create.tags.label": "Tags",
"testCase.create.tags.placeholder": "Comma-separated tags (optional)",
"testCase.create.title": "Add Test Case",
"testCase.delete.confirm": "Are you sure you want to delete this test case?",
"testCase.delete.error": "Failed to delete test case",
"testCase.delete.success": "Test case deleted",
"testCase.edit.error": "Failed to update test case",
"testCase.edit.success": "Test case updated successfully",
"testCase.edit.title": "Edit Test Case",
"testCase.empty.description": "Import or manually add test cases to this dataset",
"testCase.empty.title": "No test cases yet",
"testCase.preview.expected": "Expected",
"testCase.preview.input": "Input",
"testCase.preview.title": "Test Case Preview",
"testCase.search.placeholder": "Search cases..."
}