# Source code for audiomate.corpus.io.free_spoken_digits

import os
import glob

import audiomate
from audiomate import annotations
from audiomate import issuers
from . import base
from . import downloader

# Zip archive of the master branch of the Free-Spoken-Digit GitHub repository.
MASTER_DOWNLOAD_URL = 'https://github.com/Jakobovski/free-spoken-digit-dataset/archive/master.zip'


class FreeSpokenDigitDownloader(downloader.ArchiveDownloader):
    """
    Downloader for the Free-Spoken-Digit dataset.

    Args:
        url (str): The url to download the dataset from. If not given
                   (``None``), ``MASTER_DOWNLOAD_URL`` is used.
                   It is expected to be a zip file.
    """

    def __init__(self, url=None):
        # Fall back to the module-level default archive when no URL is supplied.
        if url is None:
            url = MASTER_DOWNLOAD_URL

        # ``move_files_up=True`` is forwarded unchanged to the base downloader.
        # NOTE(review): presumably this lifts the content of the archive's
        # single top-level folder into the target folder - confirm against
        # ``ArchiveDownloader``.
        super(FreeSpokenDigitDownloader, self).__init__(
            url,
            move_files_up=True
        )

    @classmethod
    def type(cls):
        """Return the string identifying this downloader: ``'free-spoken-digits'``."""
        return 'free-spoken-digits'


class FreeSpokenDigitReader(base.CorpusReader):
    """
    Reader for the Free-Spoken-Digit Corpus.

    Every ``*.wav`` file directly inside the ``recordings`` folder is loaded
    as one file with one utterance. The file name (without extension) is split
    at underscores: the first part becomes the label of the utterance, the
    last part is ignored and everything in between forms the speaker idx.

    .. seealso::

       `Free-Spoken-Digit-Dataset <https://github.com/Jakobovski/free-spoken-digit-dataset>`_
          Download page
    """

    @classmethod
    def type(cls):
        """Return the string identifying this reader: ``'free-spoken-digits'``."""
        return 'free-spoken-digits'

    def _check_for_missing_files(self, path):
        """
        Check that the ``recordings`` folder exists below ``path``.

        Args:
            path (str): Root folder of the corpus.

        Returns:
            list: Empty if the folder exists, otherwise a list holding the
            path of the missing ``recordings`` folder.
        """
        recordings_folder = os.path.join(path, 'recordings')

        if os.path.isdir(recordings_folder):
            return []

        return [recordings_folder]

    def _load(self, path):
        """
        Build a corpus from the wav files in ``<path>/recordings``.

        Args:
            path (str): Root folder of the corpus.

        Returns:
            The ``audiomate.Corpus`` populated with one file, one utterance
            and one single-label word-transcript label-list per wav file,
            plus one speaker per distinct speaker idx.
        """
        corpus = audiomate.Corpus(path=path)
        wav_pattern = os.path.join(path, 'recordings', '*.wav')

        # glob yields matches in arbitrary (filesystem dependent) order;
        # sorting makes the order in which entries are added reproducible.
        for file_path in sorted(glob.glob(wav_pattern)):
            # The file name without extension serves as file and utterance idx.
            file_idx = os.path.splitext(os.path.basename(file_path))[0]
            corpus.new_file(file_path, file_idx)

            # First part is the label, the last part is dropped,
            # the parts in between are re-joined into the speaker idx.
            idx_parts = file_idx.split('_')
            digit = idx_parts[0]
            issuer_idx = '_'.join(idx_parts[1:-1])

            # Register every speaker only once.
            if issuer_idx not in corpus.issuers:
                corpus.import_issuers(issuers.Speaker(issuer_idx))

            utterance = corpus.new_utterance(file_idx, file_idx, issuer_idx)
            label_list = annotations.LabelList.create_single(
                digit,
                idx=audiomate.corpus.LL_WORD_TRANSCRIPT
            )
            utterance.set_label_list(label_list)

        return corpus