UsageΒΆ

A simple example of how DanSpeech can be used. For faster inference, use either a less complex model or instantiate the Recognizer with a GPU.

from danspeech import Recognizer
from danspeech.pretrained_models import DanSpeechPrimary
from danspeech.language_models import DSL3gram
from danspeech.audio import load_audio

# Load a DanSpeech model. If the model does not exists, it will be downloaded.
model = DanSpeechPrimary()
recognizer = Recognizer(model=model)

# Load the audio file.

audio = load_audio(path="./example_files/u0013002.wav")
print(recognizer.recognize(audio))

# DanSpeech with a language model.
# Note: Requires ctcdecode to work!
lm = DSL3gram()
recognizer.update_decoder(lm=lm, alpha=1.3, beta=0.15, beam_width=32)
print(recognizer.recognize(audio, show_all=False))