Spaces:
Runtime error
Runtime error
File size: 1,308 Bytes
ec8f374 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 |
"""
Evaluation Module

This module provides comprehensive model evaluation and benchmarking tools:
metrics, a model evaluator, and benchmark suites. It also includes benchmark
building, certification tests, gap analysis, and training recommendations.
"""
# Metrics, evaluator, and benchmark names (listed under "Original exports"
# in __all__).
from .metrics import Metrics, calculate_perplexity, calculate_bleu
from .evaluator import ModelEvaluator, EvaluationConfig
from .benchmark import Benchmark, BenchmarkSuite
# .benchmark_builder exposes its own Benchmark / BenchmarkSuite; they are
# aliased here so they do not rebind the names imported from .benchmark above.
from .benchmark_builder import Benchmark as BenchmarkBuilder, BenchmarkSuite as BenchmarkBuilderSuite
# Certification test classes and a lookup helper.
# NOTE(review): get_certification_tests_for_domain presumably selects one of
# these classes by domain name -- confirm in certification_tests.
from .certification_tests import (
CertificationTestBuilder,
FinancialCertificationTests,
MedicalCertificationTests,
LegalCertificationTests,
EducationCertificationTests,
get_certification_tests_for_domain
)
from .gap_analyzer import GapAnalyzer
from .training_recommender import TrainingRecommender
# Names made available by ``from <package> import *``; each one is bound by
# the import statements earlier in this module.
__all__ = [
    # Original exports: metrics, evaluator, benchmarks
    "Metrics",
    "calculate_perplexity",
    "calculate_bleu",
    "ModelEvaluator",
    "EvaluationConfig",
    "Benchmark",
    "BenchmarkSuite",
    # New exports: benchmark builder, certification tests, analysis tools
    "BenchmarkBuilder",
    "BenchmarkBuilderSuite",
    "CertificationTestBuilder",
    "FinancialCertificationTests",
    "MedicalCertificationTests",
    "LegalCertificationTests",
    "EducationCertificationTests",
    "get_certification_tests_for_domain",
    "GapAnalyzer",
    "TrainingRecommender",
]
|