# Source code for cdp_backend.sr_models.sr_model

#!/usr/bin/env python

from __future__ import annotations

import re
from abc import ABC, abstractmethod
from pathlib import Path
from typing import Any

from ..pipeline import transcript_model

###############################################################################


class SRModel(ABC):
    """
    Abstract base class for speech recognition models.

    Concrete subclasses must implement ``transcribe``. A shared word
    normalization helper, ``_clean_word``, is provided as a static method.
    """

    @abstractmethod
    def transcribe(
        self, file_uri: str | Path, **kwargs: Any
    ) -> transcript_model.Transcript:
        """
        Transcribe audio from file and return a Transcript model.

        Parameters
        ----------
        file_uri: str | Path
            The uri to the audio file or caption file to transcribe.
        kwargs: Any
            Any extra kwargs to use in this model's transcribe function.

        Returns
        -------
        outputs: transcript_model.Transcript
            The transcript model for the supplied media file.
        """

    @staticmethod
    def _clean_word(word: str) -> str:
        """
        Normalize a single word by stripping punctuation and lowercasing.

        Every run of characters that is not a regex word character
        (letters, digits, underscore), a forward slash, a hyphen, or an
        apostrophe is removed; the remainder is lowercased.

        Parameters
        ----------
        word: str
            The raw word to clean.

        Returns
        -------
        cleaned_word: str
            The lowercased word with disallowed characters removed. May be
            empty if the input held no allowed characters.
        """
        # Keep "/", "-" and "'" so tokens such as "and/or", "well-known"
        # and "it's" survive the cleanup intact.
        cleaned_word = re.sub(r"[^\w\/\-\']+", "", word).lower()
        return cleaned_word