Source code for polyglotdb.corpus.annotated

from .summarized import SummarizedContext

from ..io.importer import (subannotations_data_to_csv, import_subannotation_csv, import_token_csv)



[docs]
class AnnotatedContext(SummarizedContext):
    """
    Class that contains methods for dealing specifically with annotations on linguistic items (termed "subannotations"
    in PolyglotDB
    """
    def import_subannotations(self, data, property_data, subannotation_name, annotation_type):
        if not self.hierarchy.has_subannotation_type(subannotation_name):
            self.hierarchy.add_subannotation_type(self, annotation_type, subannotation_name, properties=property_data)
            self.encode_hierarchy()
        subannotations_data_to_csv(self, subannotation_name, data)
        import_subannotation_csv(self, subannotation_name, annotation_type, ["id", "annotated_id"] + [x[0] for x in property_data])

    def enrich_tokens_with_csv(self, path, annotated_type, id_column, properties=None):
        import_token_csv(self, path, annotated_type, id_column, properties=properties)