Source code for polyglotdb.io.inspect.buckeye

from polyglotdb.io.parsers import BuckeyeParser
from polyglotdb.io.types.parsing import OrthographyTier, SegmentTier
from polyglotdb.structure import Hierarchy


[docs] def inspect_buckeye(word_path): """ Generate a :class:`~polyglotdb.io.parsers.buckeye.BuckeyeParser` for the Buckeye corpus. Parameters ---------- word_path : str Full path to text file Returns ------- :class:`~polyglotdb.io.parsers.buckeye.BuckeyeParser` Auto-detected parser for the Buckeye corpus """ annotation_types = [ OrthographyTier("word", "word"), OrthographyTier("transcription", "word"), OrthographyTier("surface_transcription", "word"), OrthographyTier("category", "word"), SegmentTier("phone", "phone"), ] annotation_types[2].type_property = False annotation_types[3].type_property = False hierarchy = Hierarchy({"phone": "word", "word": None}) return BuckeyeParser(annotation_types, hierarchy)