Skip to content

Commit 9c711c3

Browse files
committed
LLMs Benchmark
1 parent 503d563 commit 9c711c3

20 files changed

+4081
-0
lines changed

.gitignore

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,3 +12,5 @@ OPENROUTER_INTEGRATION_PLAN.md
12 12
build_installer.bat
13 13
build/
14 14
/dist
15+
/benchmark_results/
16+
/wiki/

benchmark/__init__.py

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,30 @@
1+
"""
2+
Benchmark module for multilingual translation quality testing.
3+
4+
This module provides tools for:
5+
- Running translation benchmarks across multiple languages and models
6+
Evaluating translation quality via an LLM (OpenRouter)
7+
- Generating GitHub wiki pages with results
8+
"""
9+
10+
from benchmark.config import BenchmarkConfig
11+
from benchmark.models import (
12+
Language,
13+
LanguageCategory,
14+
ReferenceText,
15+
TranslationResult,
16+
EvaluationScores,
17+
BenchmarkRun,
18+
)
19+
20+
__version__ = "1.0.0"
21+
22+
__all__ = [
23+
"BenchmarkConfig",
24+
"Language",
25+
"LanguageCategory",
26+
"ReferenceText",
27+
"TranslationResult",
28+
"EvaluationScores",
29+
"BenchmarkRun",
30+
]

0 commit comments

Comments
 (0)