Newer
Older
from new_experiment.new_dependency_provider import get_experiment_repository, get_minio_audio_record_repository
from new_experiment.utils.loaded_remote_dataset_helper import LoadedRemoteDatasetHelper
from new_experiment.utils.property_helper import PropertyHelper
from sziszapangma.integration.experiment_manager import ExperimentManager
from sziszapangma.integration.task.classic_wer_metric_task import ClassicWerMetricTask
def run_word_wer_classic_pipeline(dataset_name: str, asr_name: str):
repository = get_experiment_repository(dataset_name)
experiment_processor = ExperimentManager(
record_id_iterator=LoadedRemoteDatasetHelper(repository, get_minio_audio_record_repository(), dataset_name),
processing_tasks=[
ClassicWerMetricTask(
task_name=f'ClassicWerMetricTask___{dataset_name}___{asr_name}',
asr_property_name=PropertyHelper.asr_result(asr_name),
gold_transcript_property_name=PropertyHelper.get_gold_transcript_words(),
metrics_property_name=PropertyHelper.word_wer_classic_metrics(asr_name),
alignment_property_name=PropertyHelper.word_wer_classic_alignment(asr_name)
),
],
experiment_repository=repository
)
experiment_processor.process()
if __name__ == '__main__':
run_word_wer_classic_pipeline('de_minds14', 'whisper_tiny')