Python get_offsets 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: tmdm.util

메소드/함수: get_offsets

hotexamples.com에서의 예제들: 10

Python get_offsets - 10개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python tmdm.util.get_offsets의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 개선하는 데 도움이 됩니다.

예제 #1

파일 보기

파일: cached.py 프로젝트: schlevik/tmdm

class Cached(Provider):
    """Provider that serves annotations out of a cache loaded from a file.

    Cached entries are looked up by ``doc._.id``.  A *schema* decides how a
    cached entry is turned into the returned annotation: it is either the
    ``OFFSETS`` marker (entry is returned as-is), or a callable invoked as
    ``schema(doc, entry)``.  An optional *getter* is applied to the entry
    first whenever a schema is set.
    """

    cache: Dict[str, Any]
    name = 'cached'

    # Dispatch table: schema name -> ``OFFSETS`` marker or a converter
    # called with ``(doc, annotation)``.
    known_schemas = {
        # --- schemas that rely on the document's own tokenisation ---
        "bio": lambda doc, annotation: offsets_from_biluo_tags(
            iob_to_biluo(doc, annotation)
        ),
        "bilou": offsets_from_biluo_tags,
        "offsets": OFFSETS,
        "list_of_clusters": convert_clusters_to_offsets,
        # --- schemas that bring their own tokenisation ---
        # annotation: List[Tuple[str, str]]
        "list_of_tuples_bio_flat": lambda doc, annotation: get_offsets(
            doc.text, annotation
        ),
        # annotation: List[List[Tuple[str, str]]]
        "list_of_tuples_bio_stacked": lambda doc, annotation: (
            get_offsets_from_sentences(doc.text, annotation)
        ),
        # annotation: Tuple[List[str], List[str]]; the first two members are
        # zipped element-wise into pairs.
        "tuple_of_lists_flat": lambda doc, annotation: get_offsets(
            doc.text, zip(*annotation[:2])
        ),
        # annotation: a list whose items each carry two parallel lists in
        # their first two positions; all resulting pairs are yielded as one
        # flat stream.
        # NOTE(review): the stacked schema above hands nested sentences to
        # get_offsets_from_sentences, this one hands it flat pairs - confirm
        # the helper accepts both.
        "list_of_tuples_of_lists": lambda doc, annotation: (
            get_offsets_from_sentences(
                doc.text,
                (
                    (word, label)
                    for pair_of_lists in annotation
                    for word, label in zip(*pair_of_lists[:2])
                ),
            )
        ),
        # annotation: two parallel lists of lists in the first two
        # positions; inner lists are zipped pairwise and flattened.
        "tuple_of_lists_of_lists": lambda doc, annotation: (
            get_offsets_from_sentences(
                doc.text,
                (
                    (word, label)
                    for words, labels in zip(*annotation[:2])
                    for word, label in zip(words, labels)
                ),
            )
        ),
        # TODO: BRAT
        # TODO: Pubmed
    }

    def __init__(
        self,
        schema: Union[str, Callable[[Doc, Any], OffsetAnnotation]] = None,
        getter=None,
        path: str = None,
    ):
        """Set up an empty cache and resolve the conversion schema.

        Args:
            schema: Key of ``known_schemas``, or a callable taking
                ``(doc, annotation)``.  A falsy value selects ``OFFSETS``;
                anything else that is neither a known key nor callable
                leaves the schema unset (``None``).
            getter: Optional callable applied to a cached entry before the
                schema sees it.
            path: If truthy, the cache is loaded from this path right away.
        """
        self.cache = {}
        self.loaded = False

        if not schema:
            resolved = OFFSETS
        elif schema in self.known_schemas:
            resolved = Cached.known_schemas[schema]
        elif isinstance(schema, Callable):
            resolved = schema
        else:
            resolved = None
        self.schema = resolved

        self.getter = getter
        if path:
            self.load(path)

    @overrides
    def save(self, path: str):
        """Write the current cache to *path* via ``util.save_file``."""
        util.save_file(self.cache, path)

    # TODO: guess schema

    @overrides
    def load(self, path):
        """Replace the cache with the content of *path* and mark it loaded."""
        self.cache = util.load_file(path)
        self.loaded = True

    @overrides
    def annotate_document(self, doc: Doc) -> OffsetAnnotation:
        """Return the cached annotation for *doc*, converted by the schema.

        Returns:
            ``None`` when the cache has no (truthy) entry for ``doc._.id``;
            the raw entry when no schema is set; otherwise the entry, passed
            through ``getter`` if one is set, and then either returned
            directly (``OFFSETS``) or converted with ``schema(doc, entry)``.

        Raises:
            ValueError: If no cache has been loaded yet.
        """
        if not self.loaded:
            raise ValueError("You forgot to load the cache!")

        entry = self.cache.get(doc._.id)
        if not entry:
            return None

        if not self.schema:
            # Without a schema the entry is handed back untouched; note that
            # the getter is not applied on this path either.
            logger.info(
                f"no schema loaded for {self.__class__.__name__}, good luck!"
            )
            return entry

        already_offsets = self.schema == OFFSETS
        payload = self.getter(entry) if self.getter else entry
        if already_offsets:
            return payload
        return self.schema(doc, payload)

예제 #2

파일 보기