Python ComputerVisionClient.recognize_printed_text 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: azure.cognitiveservices.vision.computervision

클래스/타입: ComputerVisionClient

메소드/함수: recognize_printed_text

hotexamples.com에서의 예제들: 2

Python ComputerVisionClient.recognize_printed_text - 2개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한, Python의 azure.cognitiveservices.vision.computervision.ComputerVisionClient.recognize_printed_text에 대한 실제 사용 예제 중 가장 높은 평가를 받은 것들입니다. 예제를 평가해 주시면 예제 품질 향상에 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

ComputerVisionClient(30)

analyze_image(19)

get_read_result(14)

describe_image(12)

analyze_image_in_stream(12)

detect_objects_in_stream(11)

read(10)

describe_image_in_stream(9)

read_in_stream(9)

batch_read_file_in_stream(7)

detect_objects(6)

get_read_operation_result(6)

analyze_image_by_domain(6)

batch_read_file(5)

analyze_image_by_domain_in_stream(4)

generate_thumbnail_in_stream(3)

generate_thumbnail(2)

recognize_printed_text(2)

get_text_operation_result(1)

list_models(1)

예제 #1

파일 보기

파일: ComputerVisionQuickstart.py 프로젝트: pranabenator/cognitive-services-quickstart-code

# Recognize printed text with OCR in a local image:
#   1. Open the image as a binary stream and send it to the service.
#   2. Print each detected line's bounding box followed by its words.
# The stream is opened in a `with` block so the file handle is closed once
# the service call has returned (the original never closed it).
with open(local_image_path, "rb") as local_image:
    print("\nRecognizing printed text with OCR on a local image ...\n")
    ocr_result = computervision_client.recognize_printed_text_in_stream(
        local_image)

for region in ocr_result.regions:
    for line in region.lines:
        print("Bounding box: {}".format(line.bounding_box))
        # Every word is followed by a single space, including the last one.
        s = "".join(word.text + " " for word in line.words)
        print(s + "\n")
#   END - Recognize printed text with OCR in a local image

# OCR on a remote image:
#   1. Pass the image URL to the Computer Vision service's
#      recognize_printed_text.
#   2. For every recognized line, print its bounding box and then its words.
remote_image_url = "https://raw.githubusercontent.com/Azure-Samples/cognitive-services-sample-data-files/master/ComputerVision/Images/printed_text.jpg"

print("\nRecognizing printed text with OCR on a remote image ...\n")
ocr_result = computervision_client.recognize_printed_text(remote_image_url)
for region in ocr_result.regions:
    for line in region.lines:
        print("Bounding box: {}".format(line.bounding_box))
        # Each word is followed by one space (the last word too).
        s = "".join(word.text + " " for word in line.words)
        # Same bytes as print(s + "\n"): the text, then a blank line.
        print(s, end="\n\n")
#   END - Recognize printed text with OCR in a remote image

예제 #2

파일 보기

class ImageExtractor(BaseExtractor):
    """Extract text from images with Azure Computer Vision OCR.

    OCR here means Optical Character Recognition. The service client is
    created once in ``__init__``; when that fails, ``vision_client`` stays
    ``None`` and ``can_handle`` rejects every request.
    """

    # Shared default; replaced per instance in __init__ on success.
    vision_client = None

    def __init__(self):
        """Create the Azure client from the module-level ``key`` and ``region``.

        Any exception raised while building the client is logged as a
        warning and leaves ``self.vision_client`` set to ``None`` instead of
        propagating.
        """
        try:
            credentials = CognitiveServicesCredentials(key)
            self.vision_client = ComputerVisionClient(
                endpoint="https://" + region + ".api.cognitive.microsoft.com/",
                credentials=credentials,
            )
        except Exception as e:
            log.warning(
                f"Can't init Azure ComputerVisionClient (make sure env vars are correct): {str(e)}"
            )
            self.vision_client = None

    def _extract_text_from_image(self,
                                 filename_or_url: str,
                                 language: str = "en"):
        """Run OCR on a local file or a public URL and return its text.

        Args:
            filename_or_url: Path of an existing local file, or otherwise a
                value that is passed to the service as an image URL.
            language: Currently unused. Both service calls pass
                ``language="unk"`` (per the Azure docs this requests language
                auto-detection -- TODO confirm and decide whether this
                parameter should be honoured).

        Returns:
            A ``(fulltext, meta)`` tuple. ``fulltext`` contains every
            (spell-corrected) word followed by a space, a newline after each
            line and two extra newlines after each region. ``meta`` holds the
            ``language``, ``text_angle`` and ``orientation`` reported by the
            service.
        """
        # API docs: https://azuresdkdocs.blob.core.windows.net/$web/python/azure-cognitiveservices-vision-computervision/0.7.0/azure.cognitiveservices.vision.computervision.models.html#azure.cognitiveservices.vision.computervision.models.OcrResult

        if os.path.isfile(filename_or_url):
            # Local file: stream it to the service. The `with` block makes
            # sure the handle is closed once the call has returned.
            with open(filename_or_url, "rb") as local_image:
                ocr_result = self.vision_client.recognize_printed_text_in_stream(
                    local_image, detect_orientation=True, language="unk")
        else:
            # Anything that is not an existing file is treated as a public URL.
            ocr_result = self.vision_client.recognize_printed_text(
                url=filename_or_url, detect_orientation=True, language="unk")

        # Copy the result-level attributes into the metadata dict.
        meta = {
            "language": ocr_result.language,
            "text_angle": ocr_result.text_angle,
            "orientation": ocr_result.orientation,
        }

        # TODO improve word list w. medical dictionary + more languages.
        # FIXME: not very good results right now
        spellcheck = Spellchecker(language=ocr_result.language)

        # Collect the pieces and join once instead of repeated `+=`.
        # The loop variable is named `ocr_region` so it is not confused with
        # the module-level `region` used to build the endpoint in __init__.
        parts = []
        for ocr_region in ocr_result.regions:
            for line in ocr_region.lines:
                for word in line.words:
                    corrected = spellcheck.correct_word(word.text)
                    if corrected != word.text:
                        log.debug(
                            f"auto-corrected word: {word.text} -> {corrected}")
                    parts.append(corrected + " ")
                parts.append("\n")
            parts.append("\n\n")

        # Return multiple values
        return "".join(parts), meta

    def can_handle(self, request: ExtractorRequest) -> bool:
        """Tell whether this extractor can process ``request``.

        Returns ``False`` (and logs a warning) when the Azure client was not
        initialized. Otherwise returns ``True`` when ``request.url`` or
        ``request.filename`` is set and accepted by
        ``_is_supported_content_type``.
        """
        if not self.vision_client:
            log.warning(
                "Can't handle input, as the Azure Computer Vision Client hasn't been initialized"
            )
            return False

        # bool(...) so the declared return type holds: the bare and/or chain
        # could otherwise hand back None, "" or another non-bool operand.
        return bool(
            (request.url and _is_supported_content_type(request.url))
            or (request.filename
                and _is_supported_content_type(request.filename)))

    def extract(self, request: ExtractorRequest) -> ExtractorResponse:
        """Extract the text of the image referenced by ``request``.

        ``request.url`` is used when it is truthy, otherwise
        ``request.filename``. On success the response carries the text and
        the OCR metadata extended with ``source`` and ``extractor`` entries.
        Any exception is logged and turned into an error response instead of
        propagating.
        """
        log.info("Extracting text from image (Azure Computer Vision OCR) ...")

        try:
            if request.url:
                fulltext, meta = self._extract_text_from_image(request.url)
            else:
                fulltext, meta = self._extract_text_from_image(
                    request.filename)
            # TODO get some meta data as well
            meta = {**meta, "source": "image", "extractor": "az-vision"}

            return ExtractorResponse(text=fulltext, meta=meta)
        except Exception as e:
            msg = f"Error extracting text using Azure Computer Vision: '{str(e)}'"
            log.error(msg)
            return ExtractorResponse(error=msg)