File size: 1,308 Bytes
ec8f374
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
"""
Evaluation Module

This module provides comprehensive model evaluation and benchmarking tools.
Includes benchmark building, certification tests, gap analysis, and training recommendations.
"""

from .metrics import Metrics, calculate_perplexity, calculate_bleu
from .evaluator import ModelEvaluator, EvaluationConfig
from .benchmark import Benchmark, BenchmarkSuite
from .benchmark_builder import Benchmark as BenchmarkBuilder, BenchmarkSuite as BenchmarkBuilderSuite
from .certification_tests import (
    CertificationTestBuilder,
    FinancialCertificationTests,
    MedicalCertificationTests,
    LegalCertificationTests,
    EducationCertificationTests,
    get_certification_tests_for_domain
)
from .gap_analyzer import GapAnalyzer
from .training_recommender import TrainingRecommender

# Public API of the package; entries follow the order of the imports above.
__all__ = [
    # Metrics, evaluator, and benchmark primitives (the original exports)
    "Metrics",
    "calculate_perplexity",
    "calculate_bleu",
    "ModelEvaluator",
    "EvaluationConfig",
    "Benchmark",
    "BenchmarkSuite",
    # Newer exports. BenchmarkBuilder / BenchmarkBuilderSuite are the aliases
    # under which benchmark_builder's Benchmark / BenchmarkSuite are imported.
    "BenchmarkBuilder",
    "BenchmarkBuilderSuite",
    "CertificationTestBuilder",
    "FinancialCertificationTests",
    "MedicalCertificationTests",
    "LegalCertificationTests",
    "EducationCertificationTests",
    "get_certification_tests_for_domain",
    "GapAnalyzer",
    "TrainingRecommender",
]