Example #1
    def load_model(self):
        self.compiled_model = self.core.compile_model(self.model, self.device, self.plugin_config)
        self.async_queue = AsyncInferQueue(self.compiled_model, self.max_num_requests)
        if self.max_num_requests == 0:
            # Add one extra request to act as a buffer for the pipeline
            self.async_queue = AsyncInferQueue(self.compiled_model, len(self.async_queue) + 1)

        log.info('The model {} is loaded to {}'.format("from buffer" if self.model_from_buffer else self.model_path, self.device))
        self.log_runtime_settings()
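Example #1 only builds the queue; how it is driven is not shown in that snippet. A minimal sketch of a hypothetical driver for the same class (the method names and the frame_id user data below are illustrative, not part of the original code) could look like this:

    def submit_data(self, inputs, frame_id):
        # start_async() blocks until a request slot in the queue is free, then runs
        # inference asynchronously; frame_id is forwarded to the completion callback.
        self.async_queue.start_async(inputs, frame_id)

    def await_all(self):
        # Block until every in-flight request has finished.
        self.async_queue.wait_all()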
Example #2
    def load_model(self,
                   core,
                   model_xml,
                   device,
                   model_type,
                   num_reqs=1,
                   cpu_extension=''):
        """Loads a model in the Inference Engine format"""
        # Plugin initialization for specified device and load extensions library if specified
        if cpu_extension and 'CPU' in device:
            core.add_extension(cpu_extension, 'CPU')
        # Read IR
        log.info('Reading {} model {}'.format(model_type, model_xml))
        self.model = core.read_model(model_xml)

        if len(self.model.inputs) not in self.get_allowed_inputs_len():
            raise RuntimeError(
                "Supports topologies with only {} inputs, but got {}".format(
                    self.get_allowed_inputs_len(), len(self.model.inputs)))
        if len(self.model.outputs) not in self.get_allowed_outputs_len():
            raise RuntimeError(
                "Supports topologies with only {} outputs, but got {}".format(
                    self.get_allowed_outputs_len(), len(self.model.outputs)))

        self.input_tensor_name = self.model.inputs[0].get_any_name()
        self.output_tensor_name = self.model.outputs[0].get_any_name()
        # Loading model to the plugin
        compiled_model = core.compile_model(self.model, device)
        self.infer_queue = AsyncInferQueue(compiled_model, num_reqs)
        self.infer_queue.set_callback(self.completion_callback)
        log.info('The {} model {} is loaded to {}'.format(
            model_type, model_xml, device))
Example #3
 def create_infer_requests(self, exe_network):
     if self.api_type == 'sync':
         requests = [exe_network.create_infer_request()]
     else:
         requests = AsyncInferQueue(exe_network, self.nireq)
         self.nireq = len(requests)
     return requests
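Depending on api_type, the caller gets back either a one-element list of plain infer requests or an AsyncInferQueue, so the inference loop has to branch the same way. A hypothetical caller sketch (the inputs argument is assumed, not part of the original snippet):

 def infer_once(self, requests, inputs):
     if self.api_type == 'sync':
         # Blocking inference on the single request created above
         return requests[0].infer(inputs)
     # Asynchronous path: the queue schedules the work on an idle request;
     # results are delivered to the callback registered on the queue, if any.
     requests.start_async(inputs)
     requests.wait_all()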
Example #4
    def __init__(self, model_path, device, core, num_requests, model_type, output_shape=None):
        log.info('Reading {} model {}'.format(model_type, model_path))
        self.model = core.read_model(model_path)

        if len(self.model.inputs) != 1:
            raise RuntimeError("The {} wrapper supports only models with 1 input layer".format(model_type))

        self.outputs = {}
        compiled_model = core.compile_model(self.model, device)
        self.infer_queue = AsyncInferQueue(compiled_model, num_requests)
        self.infer_queue.set_callback(self.completion_callback)
        log.info('The {} model {} is loaded to {}'.format(model_type, model_path, device))

        self.input_tensor_name = self.model.inputs[0].get_any_name()

        if len(self.model.outputs) > 1:
            if output_shape is not None:
                candidates = []
                for output_tensor in self.model.outputs:
                    if len(output_tensor.partial_shape) != len(output_shape):
                        continue

                    if output_tensor.partial_shape[1] == output_shape[1]:
                        candidates.append(output_tensor.get_any_name())

                if len(candidates) != 1:
                    raise RuntimeError("One output is expected")
                self.output_tensor_name = candidates[0]
            else:
                raise RuntimeError("One output is expected")
        else:
            self.output_tensor_name = self.model.outputs[0].get_any_name()

        self.input_size = self.model.input(self.input_tensor_name).shape
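The completion_callback registered above via set_callback() is not part of this snippet; given the self.outputs = {} dictionary, a plausible sketch (assuming the second callback argument is the id passed to start_async) is:

    def completion_callback(self, infer_request, id):
        # Copy the finished request's output so it survives reuse of the request,
        # keyed by the caller-supplied id.
        self.outputs[id] = infer_request.get_tensor(self.output_tensor_name).data.copy()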
Example #5
def test_results_async_infer(device):
    jobs = 8
    num_request = 4
    core = Core()
    func = core.read_model(test_net_xml, test_net_bin)
    exec_net = core.compile_model(func, device)
    infer_queue = AsyncInferQueue(exec_net, num_request)
    jobs_done = [{"finished": False, "latency": 0} for _ in range(jobs)]

    def callback(request, job_id):
        jobs_done[job_id]["finished"] = True
        jobs_done[job_id]["latency"] = request.latency

    img = read_image()
    infer_queue.set_callback(callback)
    assert infer_queue.is_ready()
    for i in range(jobs):
        infer_queue.start_async({"data": img}, i)
    infer_queue.wait_all()

    request = exec_net.create_infer_request()
    outputs = request.infer({0: img})

    for i in range(num_request):
        assert np.allclose(list(outputs.values()),
                           list(infer_queue[i].results.values()))
Example #6
 def create_infer_requests(self, compiled_model):
     if self.api_type == 'sync':
         requests = [compiled_model.create_infer_request()]
     else:
         requests = AsyncInferQueue(compiled_model, self.nireq)
         self.nireq = len(requests)
     return requests
Example #7
 def deploy(self, device, max_requests=1):
     self.max_requests = max_requests
     compiled_model = self.core.compile_model(self.model, device)
     self.output_tensor = compiled_model.outputs[0]
     self.infer_queue = AsyncInferQueue(compiled_model, self.max_requests)
     self.infer_queue.set_callback(self.completion_callback)
     log.info('The {} model {} is loaded to {}'.format(
         self.model_type, self.model_path, device))
Example #8
    def _process_dataset_async(self,
                               stats_layout,
                               sampler,
                               print_progress=False,
                               need_metrics_per_sample=False,
                               requests_num=0):
        """Performs model inference on specified dataset subset asynchronously
        :param stats_layout: dict of stats collection functions {node_name: [fn]} (optional)
        :param sampler: sampling dataset to make inference
        :param print_progress: whether to print inference progress
        :param need_metrics_per_sample: whether to collect metrics for each batch
        :param requests_num: number of infer requests
        """
        def completion_callback(request, user_data):
            start_time, batch_id = user_data
            predictions = request.results
            self._process_infer_output(stats_layout, predictions,
                                       batch_annotations, batch_meta,
                                       need_metrics_per_sample)

            # Print progress
            if self._print_inference_progress(progress_log_fn, batch_id,
                                              len(sampler), start_time,
                                              time()):
                start_time = time()

        progress_log_fn = logger.info if print_progress else logger.debug
        self._ie.set_config(
            {
                'CPU_THROUGHPUT_STREAMS': 'CPU_THROUGHPUT_AUTO',
                'CPU_BIND_THREAD': 'YES'
            }, self._device)

        # Load model to the plugin
        compiled_model = self._ie.compile_model(model=self._model,
                                                device_name=self._device)

        optimal_requests_num = compiled_model.get_metric(
            'OPTIMAL_NUMBER_OF_INFER_REQUESTS')
        requests_num = optimal_requests_num if requests_num == 0 else requests_num
        logger.debug('Async mode requests number: %d', requests_num)
        infer_queue = AsyncInferQueue(compiled_model, requests_num)

        progress_log_fn('Start inference of %d images', len(sampler))

        sampler_iter = iter(enumerate(sampler))
        # Start inference
        start_time = time()
        infer_queue.set_callback(completion_callback)
        for batch_id, data_batch in sampler_iter:
            batch_annotations, image_batch, batch_meta = self._process_batch(
                data_batch)
            infer_queue.start_async(
                self._fill_input(compiled_model, image_batch),
                (start_time, batch_id))
        infer_queue.wait_all()
        progress_log_fn('Inference finished')
Example #9
 def deploy(self, device, plugin_config, max_requests=1):
     self.max_requests = max_requests
     compiled_model = self.core.compile_model(self.model,
                                              device,
                                              config=plugin_config)
     self.infer_queue = AsyncInferQueue(compiled_model, self.max_requests)
     self.infer_queue.set_callback(self.completion_callback)
     log.info('The {} model {} is loaded to {}'.format(
         self.model_type, self.model_path, device))
Example #10
 def get_infer_queue(self, log=True):
     if self.config.get('num_requests', 'AUTO') == 'AUTO':
         num_requests = 0
     else:
         num_requests = self.num_requests
     queue = AsyncInferQueue(self.exec_network, num_requests)
     if log:
         print_info('Prepared async infer queue with {} requests'.format(
             len(queue)))
     return queue
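In the snippet above, 'AUTO' maps to 0 because AsyncInferQueue treats a request count of 0 as "choose an optimal number automatically"; len(queue) then reports how many requests were actually created. A quick sketch, assuming a compiled_model is already available:

    queue = AsyncInferQueue(compiled_model, 0)  # 0 -> runtime-selected number of requests
    print(len(queue))                           # number of infer requests actually created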
Example #11
def test_infer_queue_is_ready(device):
    core = Core()
    param = ops.parameter([10])
    model = Model(ops.relu(param), [param])
    compiled = core.compile_model(model, device)
    infer_queue = AsyncInferQueue(compiled, 1)

    def callback(request, _):
        time.sleep(0.001)
    infer_queue.set_callback(callback)
    assert infer_queue.is_ready()
    infer_queue.start_async()
    assert not infer_queue.is_ready()
    infer_queue.wait_all()
Example #12
def test_infer_queue_get_idle_handle(device):
    param = ops.parameter([10])
    model = Model(ops.relu(param), [param])
    core = Core()
    compiled = core.compile_model(model, device)
    queue = AsyncInferQueue(compiled, 2)
    niter = 10

    for _ in range(len(queue)):
        queue.start_async()
    queue.wait_all()
    for request in queue:
        assert request.wait_for(0)

    for _ in range(niter):
        idle_id = queue.get_idle_request_id()
        assert queue[idle_id].wait_for(0)
        queue.start_async()
    queue.wait_all()
Example #13
def test_infer_queue_fail_on_py_model(device):
    jobs = 1
    num_request = 1
    core = Core()
    model = core.read_model(test_net_xml, test_net_bin)
    compiled = core.compile_model(model, device)
    infer_queue = AsyncInferQueue(compiled, num_request)

    def callback(request, _):
        request = request + 21

    img = read_image()
    infer_queue.set_callback(callback)

    with pytest.raises(TypeError) as e:
        for _ in range(jobs):
            infer_queue.start_async({"data": img})
        infer_queue.wait_all()

    assert "unsupported operand type(s) for +" in str(e.value)
Example #14
def test_infer_queue_fail_on_cpp_model(device):
    jobs = 6
    num_request = 4
    core = Core()
    model = core.read_model(test_net_xml, test_net_bin)
    compiled = core.compile_model(model, device)
    infer_queue = AsyncInferQueue(compiled, num_request)

    def callback(request, _):
        request.get_tensor("Unknown")

    img = read_image()
    infer_queue.set_callback(callback)

    with pytest.raises(RuntimeError) as e:
        for _ in range(jobs):
            infer_queue.start_async({"data": img})
        infer_queue.wait_all()

    assert "Port for tensor name Unknown was not found" in str(e.value)
Example #15
def test_infer_queue(device):
    jobs = 8
    num_request = 4
    core = Core()
    model = core.read_model(test_net_xml, test_net_bin)
    compiled = core.compile_model(model, device)
    infer_queue = AsyncInferQueue(compiled, num_request)
    jobs_done = [{"finished": False, "latency": 0} for _ in range(jobs)]

    def callback(request, job_id):
        jobs_done[job_id]["finished"] = True
        jobs_done[job_id]["latency"] = request.latency

    img = read_image()
    infer_queue.set_callback(callback)
    for i in range(jobs):
        infer_queue.start_async({"data": img}, i)
    infer_queue.wait_all()
    assert all(job["finished"] for job in jobs_done)
    assert all(job["latency"] > 0 for job in jobs_done)
Example #16
    def __init__(self, model_path, core, target_device, num_requests, model_type):
        log.info('Reading {} model {}'.format(model_type, model_path))
        self.model = core.read_model(model_path)
        if len(self.model.inputs) != 1:
            log.error("Demo supports only models with 1 input")
            sys.exit(1)

        if len(self.model.outputs) != 1:
            log.error("Demo supports only models with 1 output")
            sys.exit(1)

        self.outputs = {}
        compiled_model = core.compile_model(self.model, target_device)
        self.output_tensor = compiled_model.outputs[0]
        self.input_name = self.model.inputs[0].get_any_name()
        self.input_shape = self.model.inputs[0].shape

        self.num_requests = num_requests
        self.infer_queue = AsyncInferQueue(compiled_model, num_requests)
        self.infer_queue.set_callback(self.completion_callback)
        log.info('The {} model {} is loaded to {}'.format(model_type, model_path, target_device))
Example #17
    def _init_model(self, inp_h, inp_w):
        # For better efficiency, model is initialized for batch_size 1 and every sample processed independently
        inp_shape = [1, inp_h, inp_w, 3]
        self.net.reshape({self.input_name: inp_shape})

        # Load network to device
        if "CPU" in self.device:
            self.core.set_property(
                "CPU", {
                    "CPU_THROUGHPUT_STREAMS": "CPU_THROUGHPUT_AUTO",
                    "CPU_BIND_THREAD": "YES"
                })
        if "GPU" in self.device:
            self.core.set_property(
                "GPU", {"GPU_THROUGHPUT_STREAMS": "GPU_THROUGHPUT_AUTO"})

        compiled_model = self.core.compile_model(self.net, self.device)
        num_requests = compiled_model.get_property(
            "OPTIMAL_NUMBER_OF_INFER_REQUESTS")
        print(f"OpenVINO uses {num_requests} inference requests")
        self.infer_queue = AsyncInferQueue(compiled_model, num_requests)
Example #18
def infer_async(compiled_model, number_iter, num_request, get_slice):
    result = None
    infer_queue = AsyncInferQueue(compiled_model, num_request)
    iteration = 0
    inference_time = time()
    while iteration < max(number_iter, num_request):
        # get_idle_request_id() blocks until at least one request slot is free,
        # so the returned id is always valid.
        idle_id = infer_queue.get_idle_request_id()
        utils.set_input_to_blobs(infer_queue[idle_id], get_slice(iteration))
        infer_queue.start_async()
        iteration += 1
    infer_queue.wait_all()
    inference_time = time() - inference_time
    if number_iter == 1:
        request_results = [utils.get_request_result(request) for request in infer_queue]
        output_names = request_results[0].keys()
        result = dict.fromkeys(output_names, None)
        for key in result:
            result[key] = np.concatenate([request_result[key] for request_result in request_results], axis=0)
    return result, inference_time
Example #19
    def load_model(self, core, model_path, device, model_type, num_reqs=1):
        """Loads a model in the Inference Engine format"""

        log.info('Reading {} model {}'.format(model_type, model_path))
        self.model = core.read_model(model_path)

        if len(self.model.inputs) not in self.get_allowed_inputs_len():
            raise RuntimeError(
                "Supports topologies with only {} inputs, but got {}".format(
                    self.get_allowed_inputs_len(), len(self.model.inputs)))
        if len(self.model.outputs) not in self.get_allowed_outputs_len():
            raise RuntimeError(
                "Supports topologies with only {} outputs, but got {}".format(
                    self.get_allowed_outputs_len(), len(self.model.outputs)))

        self.input_tensor_name = self.model.inputs[0].get_any_name()
        self.output_tensor_name = self.model.outputs[0].get_any_name()
        # Loading model to the plugin
        compiled_model = core.compile_model(self.model, device)
        self.infer_queue = AsyncInferQueue(compiled_model, num_reqs)
        self.infer_queue.set_callback(self.completion_callback)
        log.info('The {} model {} is loaded to {}'.format(
            model_type, model_path, device))
Example #20
def main() -> int:
    log.basicConfig(format='[ %(levelname)s ] %(message)s',
                    level=log.INFO,
                    stream=sys.stdout)
    args = parse_args()

    # --------------------------- Step 1. Initialize OpenVINO Runtime Core ------------------------------------------------
    log.info('Creating OpenVINO Runtime Core')
    core = Core()

    # --------------------------- Step 2. Read a model --------------------------------------------------------------------
    log.info(f'Reading the model: {args.model}')
    # (.xml and .bin files) or (.onnx file)
    model = core.read_model(args.model)

    if len(model.inputs) != 1:
        log.error('Sample supports only single input topologies')
        return -1

    if len(model.outputs) != 1:
        log.error('Sample supports only single output topologies')
        return -1


    # --------------------------- Step 3. Set up input --------------------------------------------------------------------
    # Read input images
    images = [cv2.imread(image_path) for image_path in args.input]

    # Resize images to model input dims
    _, _, h, w = model.input().shape
    resized_images = [cv2.resize(image, (w, h)) for image in images]

    # Add N dimension
    input_tensors = [np.expand_dims(image, 0) for image in resized_images]

    # --------------------------- Step 4. Apply preprocessing -------------------------------------------------------------
    ppp = PrePostProcessor(model)

    # 1) Set input tensor information:
    # - input() provides information about a single model input
    # - precision of tensor is supposed to be 'u8'
    # - layout of data is 'NHWC'
    ppp.input().tensor() \
        .set_element_type(Type.u8) \
        .set_layout(Layout('NHWC'))  # noqa: N400

    # 2) Here we suppose model has 'NCHW' layout for input
    ppp.input().model().set_layout(Layout('NCHW'))

    # 3) Set output tensor information:
    # - precision of tensor is supposed to be 'f32'
    ppp.output().tensor().set_element_type(Type.f32)

    # 4) Apply preprocessing, modifying the original 'model'
    model = ppp.build()

    # --------------------------- Step 5. Loading model to the device -----------------------------------------------------
    log.info('Loading the model to the plugin')
    compiled_model = core.compile_model(model, args.device)

    # --------------------------- Step 6. Create infer request queue ------------------------------------------------------
    log.info('Starting inference in asynchronous mode')
    infer_queue = AsyncInferQueue(compiled_model, len(input_tensors))
    infer_queue.set_callback(completion_callback)

    # --------------------------- Step 7. Do inference --------------------------------------------------------------------
    for i, input_tensor in enumerate(input_tensors):
        infer_queue.start_async({0: input_tensor}, args.input[i])

    infer_queue.wait_all()
    # ----------------------------------------------------------------------------------------------------------------------
    log.info(
        'This sample is an API example, for any performance measurements please use the dedicated benchmark_app tool\n'
    )
    return 0
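Example #20 registers a module-level completion_callback that is not part of the excerpt. A minimal sketch, assuming the user data is the image path passed to start_async (the real sample goes on to post-process the classification results):

def completion_callback(infer_request, image_path):
    # The second argument is the user data passed to start_async(), here the image path.
    predictions = next(iter(infer_request.results.values()))
    log.info(f'Finished {image_path}, output shape: {predictions.shape}')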
Example #21
def check_gil_released_safe(func, args=()):
    # Signature reconstructed from the call sites below. detect_gil (not shown in this
    # excerpt) runs in a separate thread and sets the module-level gil_released flag to
    # True once it gets a chance to execute, i.e. once func releases the GIL.
    global gil_released
    gil_released = False
    thread = Thread(target=detect_gil)
    thread.start()
    func(*args)
    if not gil_released:
        pytest.xfail(reason="Depend on condition race")
    thread.join()


device = os.environ.get("TEST_DEVICE") if os.environ.get("TEST_DEVICE") else "CPU"
core = Core()
core.set_property({"PERF_COUNT": "YES"})
param = ops.parameter([224, 224])
model = Model(ops.relu(param), [param])
compiled = core.compile_model(model, device)
infer_queue = AsyncInferQueue(compiled, 1)
user_stream = io.BytesIO()


# AsyncInferQueue

def test_gil_released_async_infer_queue_start_async():
    infer_queue.start_async()
    check_gil_released_safe(infer_queue.start_async)


def test_gil_released_async_infer_queue_is_ready():
    infer_queue.start_async()
    check_gil_released_safe(infer_queue.is_ready)