Python Document.from_json 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: models.document

클래스/타입: Document

메소드/함수: from_json

hotexamples.com에서의 예제들: 10

Python Document.from_json - 10개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python models.document.Document.from_json의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 개선하는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Document(30)

from_json(6)

path(5)

getkey(4)

save(4)

query(4)

text(3)

open(3)

updated_at(2)

to_dict(2)

tags(2)

partner(2)

new(2)

name(2)

meta(2)

value(2)

get_revision_by_timestamp(2)

date(2)

htmlcontent(1)

put(1)

clone(1)

csscontent(1)

documentName(1)

elastic_score(1)

get_by_dates(1)

process_document(1)

account(1)

get_by_page(1)

get_content(1)

get_id(1)

newname(1)

get_latest_revision(1)

get_title(1)

key(1)

예제 #1

파일 보기

 def from_dict(d):
     """
     Rebuild a MatchSet from its dictionary form.

     :param d: mapping with 'matches', 'alpha_doc' and 'beta_doc' entries;
               each item of 'matches' goes through Match.from_dict and the
               two document entries go through Document.from_json
     :return: MatchSet assembled from the converted entries
     """
     converted = []
     for raw_match in d['matches']:
         converted.append(Match.from_dict(raw_match))
     first_doc = Document.from_json(d['alpha_doc'])
     second_doc = Document.from_json(d['beta_doc'])
     match_set = MatchSet(alpha_doc=first_doc,
                          beta_doc=second_doc,
                          matches=converted)
     return match_set

예제 #2

파일 보기

파일: DIRT.py 프로젝트: gnarph/DIRT

def process_parallel_worker(a, output_dir, gap_length, match_length, b, comparator):
    """
    Compare a single pair of documents; the unit of work for parallel runs.

    :param a: value handed to Document.from_json to load the alpha document
    :param output_dir: forwarded to the Processor as output_dir
    :param gap_length: forwarded to the Processor as gap_length
    :param match_length: forwarded to the Processor as match_length
    :param b: value handed to Document.from_json to load the beta document
    :param comparator: name substituted into COMPARATOR_PATH to locate the
                       comparator module to import
    """
    module_path = COMPARATOR_PATH.format(comparator)
    comparator_module = importlib.import_module(module_path)
    settings = {
        'output_dir': output_dir,
        'comparator': comparator_module,
        'gap_length': gap_length,
        'match_length': match_length,
        # This worker never uses a percentage-based match length
        'percentage_match_length': None,
    }
    pro = processor.Processor(**settings)
    pro.process(alpha_document=Document.from_json(a),
                beta_document=Document.from_json(b))

예제 #3

파일 보기

def process_parallel_worker(a, output_dir, gap_length, match_length, b,
                            comparator):
    """
    Run the processor over one alpha/beta pair (parallel worker entry point).

    The comparator module is imported by name via COMPARATOR_PATH, a
    Processor is configured from the remaining arguments, and both
    documents are loaded with Document.from_json before being processed.
    """
    # Swap the comparator name for the imported module it refers to
    comparator = importlib.import_module(COMPARATOR_PATH.format(comparator))
    pro = processor.Processor(
        output_dir=output_dir,
        comparator=comparator,
        gap_length=gap_length,
        match_length=match_length,
        percentage_match_length=None)
    # Load alpha first, then beta, only after the processor exists
    alpha, beta = (Document.from_json(source) for source in (a, b))
    pro.process(alpha_document=alpha, beta_document=beta)

예제 #4

파일 보기

파일: DIRT.py 프로젝트: gnarph/DIRT

def process_serial(args, alpha_files, beta_files):
    """
    Process every distinct alpha/beta pairing once, on a single thread.

    :param args: object exposing comparator, output_dir, gap_length and
                 match_length attributes
    :param alpha_files: iterable of values accepted by Document.from_json;
                        entries must be sortable and hashable (e.g. file
                        name strings)
    :param beta_files: iterable with the same requirements as alpha_files
    :return: number of pairs that were processed
    """
    comparator_path = COMPARATOR_PATH.format(args.comparator)
    comparator = importlib.import_module(comparator_path)
    pro = processor.Processor(output_dir=args.output_dir,
                              comparator=comparator,
                              gap_length=args.gap_length,
                              match_length=args.match_length,
                              percentage_match_length=None)
    # A set gives constant-time "already compared?" checks; the previous
    # list made every check linear in the number of processed pairs.
    compared = set()
    for a, b in itertools.product(alpha_files, beta_files):
        # Sorting makes (a, b) and (b, a) map to the same key
        this_pair = tuple(sorted([a, b]))
        if a != b and this_pair not in compared:
            alpha = Document.from_json(a)
            beta = Document.from_json(b)
            pro.process(alpha_document=alpha, beta_document=beta)
            # Recorded only after processing succeeded
            compared.add(this_pair)
    return len(compared)

예제 #5

파일 보기

def process_serial(args, alpha_files, beta_files):
    """
    Sequentially compare each unordered alpha/beta pair exactly once.

    A pair is skipped when both entries are equal or when the same two
    entries were already processed in either order.

    :param args: object providing comparator, output_dir, gap_length and
                 match_length attributes
    :param alpha_files: iterable of entries loadable by Document.from_json;
                        entries must be sortable and hashable (e.g. strings)
    :param beta_files: iterable with the same requirements as alpha_files
    :return: count of pairs that were processed
    """
    comparator_path = COMPARATOR_PATH.format(args.comparator)
    comparator = importlib.import_module(comparator_path)
    pro = processor.Processor(output_dir=args.output_dir,
                              comparator=comparator,
                              gap_length=args.gap_length,
                              match_length=args.match_length,
                              percentage_match_length=None)
    # Set of order-independent pair keys: membership tests stay O(1)
    # instead of scanning a growing list for every candidate pair.
    seen_pairs = set()
    for a, b in itertools.product(alpha_files, beta_files):
        pair_key = tuple(sorted([a, b]))
        if not (a != b):
            # Never compare an entry with itself
            continue
        if pair_key in seen_pairs:
            # Same two entries were already handled in the other order
            continue
        alpha = Document.from_json(a)
        beta = Document.from_json(b)
        pro.process(alpha_document=alpha, beta_document=beta)
        seen_pairs.add(pair_key)
    return len(seen_pairs)

예제 #6

파일 보기

파일: tests.py 프로젝트: gnarph/DIRT

    def setUp(self):
        """
        Build the fixtures shared by the tests: two loaded documents, ten
        passage pairs ('a'..'j' against 'A'..'J'), the matches derived from
        them and the MatchSet wrapping everything.
        """
        # range works on both Python 2 and 3 (xrange is Python 2 only)
        self.passages_a = [chr(i + ord('a')) for i in range(10)]
        self.passages_b = [chr(i + ord('A')) for i in range(10)]
        self.file_a = 'models/test_data/match_set_test.json'
        self.document_a = Document.from_json(self.file_a)
        self.file_b = 'models/test_data/match_set_test2.json'
        self.document_b = Document.from_json(self.file_b)

        # Pair the passages position by position
        self.singlet_pairs = [
            (MatchHalf(passage=passage_a), MatchHalf(passage=passage_b))
            for passage_a, passage_b in zip(self.passages_a, self.passages_b)
        ]
        # Alpha/beta need to be actual documents, not names
        self.matches = Processor.singlet_pairs_to_matches(alpha=self.document_a,
                                                          beta=self.document_b,
                                                          singlet_pairs=self.singlet_pairs)
        self.match_set = MatchSet(alpha_doc=self.document_a,
                                  beta_doc=self.document_b,
                                  matches=self.matches)

예제 #7

파일 보기

파일: tests.py 프로젝트: gnarph/DIRT

    def setUp(self):
        """
        Prepare test fixtures: load both test documents, create ten
        lower-case/upper-case passage pairs, convert them to matches and
        wrap the result in a MatchSet.
        """
        # range instead of the Python 2-only xrange keeps this portable
        self.passages_a = [chr(ord('a') + offset) for offset in range(10)]
        self.passages_b = [chr(ord('A') + offset) for offset in range(10)]
        self.file_a = 'models/test_data/match_set_test.json'
        self.document_a = Document.from_json(self.file_a)
        self.file_b = 'models/test_data/match_set_test2.json'
        self.document_b = Document.from_json(self.file_b)

        self.singlet_pairs = []
        # zip walks both passage lists in lockstep, no index bookkeeping
        for text_a, text_b in zip(self.passages_a, self.passages_b):
            half_a = MatchHalf(passage=text_a)
            half_b = MatchHalf(passage=text_b)
            self.singlet_pairs.append((half_a, half_b))
        # Alpha/beta need to be actual documents, not names
        self.matches = Processor.singlet_pairs_to_matches(
            alpha=self.document_a,
            beta=self.document_b,
            singlet_pairs=self.singlet_pairs)
        self.match_set = MatchSet(alpha_doc=self.document_a,
                                  beta_doc=self.document_b,
                                  matches=self.matches)

예제 #8

파일 보기

 def test_read(self):
     """
     TEIReader output must agree with TEIDocument and with the stored JSON
     """
     tei_path = self._get_test_file_name(TEI_ZHI)
     # Reference body taken straight from the TEI document wrapper
     expected_body = tei_document.TEIDocument(tei_path).get_data()['body']
     body, metadata = reader.TEIReader(tei_path).read()
     self.assertEqual(expected_body, body)
     # The JSON fixture must carry the same body and metadata
     stored = Document.from_json(self._get_test_file_name(JSON_ZHI))
     self.assertEqual(body, stored.raw_body)
     self.assertEqual(metadata, stored.metadata)

예제 #9

파일 보기

파일: tests.py 프로젝트: gnarph/DIRT

 def test_read(self):
     """
     Read a TEI xml file and compare the result against two references:
     the body reported by TEIDocument and the Document loaded from JSON
     """
     xml_file = self._get_test_file_name(TEI_ZHI)

     # Reference 1: body as reported by TEIDocument
     document = tei_document.TEIDocument(xml_file)
     data = document.get_data()
     reference_body = data['body']

     tei_reader = reader.TEIReader(xml_file)
     result = tei_reader.read()
     parsed_body, parsed_metadata = result
     self.assertEqual(reference_body, parsed_body)

     # Reference 2: Document loaded from the JSON fixture
     json_file = self._get_test_file_name(JSON_ZHI)
     json_doc = Document.from_json(json_file)
     self.assertEqual(parsed_body, json_doc.raw_body)
     self.assertEqual(parsed_metadata, json_doc.metadata)

예제 #10

파일 보기

 def test_smoke(self):
     """
     Smoke test - check that the preprocessor runs without exploding

     After processing, every file in the output directory whose name
     contains the input's base name is loaded and its recorded file names
     are checked.
     """
     pp = Preprocessor(file_name=self.file_name,
                       input_dir=self.input_dir,
                       output_dir=self.output_dir)
     pp.process()
     out_dir_files = os.listdir(self.output_dir)
     # Depends only on self.file_name, so compute it once, not per file
     name = utilities.path.get_name(self.file_name,
                                    extension=False)
     # NOTE(review): if no output file contains `name`, no assertion runs
     # and the test passes vacuously - confirm whether that is intended.
     for file_name in out_dir_files:
         if name not in file_name:
             continue
         file_path = os.path.join(self.output_dir, file_name)
         doc = Document.from_json(file_path)
         self.assertNotEqual(doc.pre_file_name, self.file_name)
         self.assertEqual(doc.file_name, 'test_preprocessed/lorem.json')