def create_document(doc_id, text, weight, length):
    """Build a ``Document`` with a fixed 16-char id, utf-8 payload, weight and length.

    NOTE(review): this writes the underlying proto id directly via
    ``_document`` and repeats/truncates the id to exactly 16 characters —
    presumably a legacy fixed-length-id requirement; confirm against the
    Document proto before changing.
    """
    doc = Document()
    doc._document.id = (str(doc_id) * 16)[:16]
    doc.buffer = text.encode('utf8')
    doc.weight = weight
    doc.length = length
    return doc
def search_generator(path: str, buffer: bytes):
    """Yield a single query ``Document`` built from *buffer* and/or *path*.

    Either field is skipped when falsy; an empty Document is yielded if both are.
    """
    query = Document()
    if buffer:
        query.buffer = buffer
    if path:
        query.content = path
    yield query
def input_index_data(num_docs=None, batch_size=8, dataset_type='f30k'):
    """Yield (image, caption) ``Document`` pairs from the test data loader.

    For every item in a batch an image Document and a caption Document
    (id = sha1 of the image bytes) are yielded. Iteration stops once
    roughly *num_docs* items have been produced, when given.
    """
    caption_file = 'dataset_flickr30k.json' if dataset_type == 'f30k' else 'captions.txt'
    # toy-data lives next to the tests; everything else under data/
    base_folder = '.' if dataset_type == 'toy-data' else 'data'
    loader = get_data_loader(
        root=os.path.join(cur_dir, f'{base_folder}/{dataset_type}/images'),
        captions=os.path.join(cur_dir, f'{base_folder}/{dataset_type}/{caption_file}'),
        split='test',
        batch_size=batch_size,
        dataset_type=dataset_type,
    )
    for batch_idx, (images, texts) in enumerate(loader):
        for image, caption in zip(images, texts):
            hashed = hashlib.sha1(image).hexdigest()
            img_doc = Document()
            img_doc.buffer = image
            img_doc.modality = 'image'
            img_doc.mime_type = 'image/jpeg'
            cap_doc = Document(id=hashed)
            cap_doc.text = caption
            cap_doc.modality = 'text'
            cap_doc.mime_type = 'text/plain'
            cap_doc.tags['id'] = caption
            yield img_doc
            yield cap_doc
        # stop once enough whole batches have been emitted
        if num_docs and (batch_idx + 1) * batch_size >= num_docs:
            break
def create_document(doc_id, text, weight, length):
    """Build a ``Document`` carrying an id, utf-8 encoded text, weight and length."""
    doc = Document()
    doc.id = doc_id
    doc.buffer = text.encode('utf8')
    doc.weight = weight
    doc.length = length
    return doc
def create(self):
    """Return a ground-truth ``Document`` whose payload matches *field_type*.

    NOTE(review): ``field_type`` is a free variable captured from the
    enclosing fixture scope — confirm it is bound before this is called.
    """
    doc = Document()
    if field_type == 'blob':
        doc.blob = np.array([1, 1, 1, 1])
    elif field_type == 'buffer':
        doc.buffer = b'\x01\x02\x03\x04'
    elif field_type == 'text':
        doc.text = 'aaaa'
    return doc
def create(self):
    """Return a query ``Document`` whose payload matches *field_type*.

    NOTE(review): ``field_type`` is a free variable captured from the
    enclosing fixture scope — confirm it is bound before this is called.
    """
    result = Document()
    if result is not None:  # always true; kept trivial — populate by field kind
        if field_type == 'blob':
            result.blob = np.array([1, 1, 1])
        elif field_type == 'buffer':
            result.buffer = b'\x01\x02\x03'
        elif field_type == 'text':
            result.text = 'aaa'
    return result
def request(field_type):
    """Build an index ``Request`` of 10 doc/groundtruth pairs.

    Each pair gets one chunk at granularity 1; the doc chunk carries a
    slightly shorter payload than the groundtruth chunk so evaluators
    have something to compare (text / buffer / blob per *field_type*).
    """
    num_docs = 10
    req = jina_pb2.RequestProto()
    for _ in range(num_docs):
        doc = req.index.docs.add()
        gt = req.index.groundtruths.add()
        doc_chunk = Document(doc.chunks.add())
        gt_chunk = Document(gt.chunks.add())
        doc_chunk.granularity = 1
        gt_chunk.granularity = 1
        if field_type == 'text':
            doc_chunk.text = 'aaa'
            gt_chunk.text = 'aaaa'
        elif field_type == 'buffer':
            doc_chunk.buffer = b'\x01\x02\x03'
            gt_chunk.buffer = b'\x01\x02\x03\x04'
        elif field_type == 'blob':
            doc_chunk.blob = np.array([1, 1, 1])
            gt_chunk.blob = np.array([1, 1, 1, 1])
    return Request(req).as_typed_request('index')
def create_document(doc_id, text, weight):
    """Build a ``Document`` with a stringified id, utf-8 encoded text and a weight."""
    doc = Document()
    doc.id = str(doc_id)
    doc.buffer = text.encode('utf8')
    doc.weight = weight
    return doc