def create_network(instance_settings: Dict[str, Any]) -> \
        Tuple[gn.GeneNet, Dict[str, Any], Dict[str, Any]]:
    """Assemble a TensorFlow computation graph for training a U-Net on the
    platelet segmentation task.

    Args:
        instance_settings (Dict[str, Any]): Dictionary of example
            instance_settings that controls the creation and training of a
            TensorFlow network.

    Returns:
        net (gn.GeneNet): An in-lab wrapper around a TensorFlow computation
            graph that implements training, eval, and inference with a
            segmentation neural network.
        train_settings (Dict[str, Any]): Settings for training `net`.
        eval_settings (Dict[str, Any]): Settings for evaluating `net`.

    """
    # See 'example1_train_unet.ipynb' for setting definitions
    instance_dir = instance_settings['instance_dir']

    # Load the training and eval volumes from the data directory
    handler = gn.DataHandler(
        train_data_dir=instance_settings['data_dir'],
        train_file='train-images.tif',
        train_label_file='train-labels.tif',
        train_weight_file='train-error-weights.tif',
        eval_file='eval-images.tif',
        eval_label_file='eval-labels.tif')

    # Build the GeneGraph for an encoder-decoder segmentation network
    graph = gn.gene_graph(instance_settings['input_shape'],
                          handler.n_classes,
                          net_settings=instance_settings['net_settings'],
                          predictor_settings={},
                          optim_settings=instance_settings['optim_settings'])

    # Image summary configuration: (summary name, colormap kwargs) pairs
    image_settings = [
        ('input', {}),
        ('classes',
         {'cmap': 'jet', 'vmin': 0, 'vmax': handler.n_classes}),
        ('probabilities', {'cmap': 'pink', 'vmin': 0, 'vmax': 1})
    ]

    # Wrap the graph in a GeneNet
    net = gn.GeneNet(graph,
                     name='U-Net',
                     save_dir=instance_dir,
                     param_seed=instance_settings['weight_seed'],
                     image_settings=image_settings)

    # Directory where eval-time media (snapshot images) will be written
    eval_media_dir = os.path.join(instance_dir, 'media')
    os.makedirs(eval_media_dir, exist_ok=True)

    # Package training info into a dict
    train_settings = {
        'data_handler': handler,
        'n_epochs': instance_settings['n_epochs'],
        'max_steps': None,
        'stop_criterion': instance_settings['stop_criterion'],
        'data_seed': instance_settings['data_seed'],
        'window_spacing': instance_settings['train_window_spacing']
    }

    # Package eval and media generation info into a dict; snapshot images
    # are drawn from the eval volume
    eval_settings = {
        'instance_dir': instance_dir,
        'eval_media_dir': eval_media_dir,
        'sample_image': handler.eval_volume,
        'sample_label': handler.eval_label_volume,
        'image_cmaps': {'data': 'gray',
                        'segmentation': 'jet',
                        'prob_maps': 'pink'}
    }

    return net, train_settings, eval_settings
def segment_better(
        net_dirs: Union[str, List[str]],
        image_file: str,
        label_file: str,
        save_dir: str,
        device: Optional[str] = None
) -> np.ndarray:
    """Segment an image volume with one or more saved networks, blending
    overlapping inference windows by distance-weighted stitching.

    Each network performs a sliding-window inference pass. Where windows
    overlap, the per-voxel prediction with the larger distance-transform
    value (presumably the more window-central prediction — the semantics of
    `memoized_distance_transform` are defined elsewhere) wins. The
    per-network probability maps are then averaged into an ensemble before
    the final argmax.

    Args:
        net_dirs (Union[str, List[str]]): One or more saved-net directories
            (a GeneNet instance is also tolerated in place of a path).
        image_file (str): Path to the image volume to segment.
        label_file (str): Path to the label volume registered with the
            image in the DataHandler.
        save_dir (str): If not None, directory where data and segmentation
            TIF images are written.
        device (Optional[str]): Device specifier forwarded to checkpoint
            restoration.

    Returns:
        segmentation (np.ndarray): Segmentation of the image volume, with
            the image's spatial shape (channel axis dropped for
            multichannel input).

    """
    if isinstance(net_dirs, str):
        net_dirs = [net_dirs]

    # Build a DataHandler around the eval image + label pair
    eval_dir = os.path.dirname(image_file)
    image_name = os.path.basename(image_file)
    label_rel_name = os.path.relpath(label_file, eval_dir)
    data_handler = gn.DataHandler(eval_data_dir=eval_dir,
                                  eval_file=image_name,
                                  eval_label_file=label_rel_name)
    data_vol = data_handler.eval_volume
    image_cmaps = {'data': 'gray', 'segmentation': 'jet', 'prob_maps': 'pink'}
    # Fixed: previously 'prediction.tif', which produced the accidental
    # double extension 'segmentation_prediction.tif.tif' below
    save_name = 'prediction'
    ndim_data = data_vol.ndim

    all_prob_maps = []
    for source in net_dirs:
        # Restore a net from disk, or use an already-constructed net
        if isinstance(source, str):
            ckpt_dir = os.path.join(source, 'model', 'checkpoints', 'best')
            net = lab.restore_from_checkpoint(source, ckpt_dir, device)
        else:
            net = source
        print(f'Net input shape: {net.gene_graph.input_shape}. '
              f'Net output shape: {net.gene_graph.output_shape()}')
        output_shape = net.gene_graph.output_shape()
        net_is_3d = len(output_shape) == 3

        # Shape of the segmentation volume is same as data volume if
        # single-channel, else ignore the channel dimension
        if ndim_data > 3:
            vol_shape = data_vol.shape[1:]
        else:
            vol_shape = data_vol.shape

        # One probability map per class
        prob_shape = [data_handler.n_classes] + list(vol_shape)
        prob_maps = np.zeros(prob_shape)
        # Distance score of the prediction currently stored at each voxel.
        # Fixed: `np.int` was a deprecated alias removed in NumPy 1.24; the
        # builtin `int` is the documented replacement.
        prob_map_update_dist = np.zeros(vol_shape, dtype=int)

        # Check if SAME padding is used; if so, overlap forward windows so
        # window seams can be blended
        gene0 = list(net.gene_graph.genes.items())[0][1]
        padding = gene0.hyperparam('padding_type')
        if padding.lower() == 'same':
            forward_window_overlap = [1] * (3 - len(output_shape)) + [
                s // 3 for s in output_shape
            ]
        else:
            forward_window_overlap = [0] * 3

        # Create an input_fn for the inference pass
        predict_input_fn = data_handler.input_fn(
            mode=tf.estimator.ModeKeys.PREDICT,
            graph_source=net,
            forward_window_overlap=forward_window_overlap,
            prediction_volume=data_vol)

        # Inference pass result generator
        results: Iterator[Dict[str, np.ndarray]] = \
            net.predict(predict_input_fn)

        # TODO: pass that distance scale triplet as a parameter instead of
        # hard-coding
        if net_is_3d:
            distance_scale = (4, 1, 1)
        else:
            distance_scale = (1, 1)

        for r in results:
            patch_prob = r['probabilities']
            patch_dist = memoized_distance_transform(patch_prob.shape[1:],
                                                     distance_scale)
            patch_corner = r['corner']
            if net_is_3d:
                z0 = patch_corner[0]
                z1 = z0 + output_shape[0]
                x0 = patch_corner[1]
                x1 = x0 + output_shape[1]
                y0 = patch_corner[2]
                y1 = y0 + output_shape[2]
                # Overwrite only voxels where this patch scores higher than
                # whatever was written before
                prev_update_dist = prob_map_update_dist[z0:z1, x0:x1, y0:y1]
                prev_prob = prob_maps[:, z0:z1, x0:x1, y0:y1]
                parts_to_update = prev_update_dist < patch_dist
                prev_prob[:, parts_to_update] = patch_prob[:, parts_to_update]
                prob_maps[:, z0:z1, x0:x1, y0:y1] = prev_prob
                prev_update_dist[parts_to_update] = \
                    patch_dist[parts_to_update]
                prob_map_update_dist[z0:z1, x0:x1, y0:y1] = prev_update_dist
            else:
                z0 = patch_corner[0]
                x0 = patch_corner[1]
                x1 = x0 + output_shape[0]
                y0 = patch_corner[2]
                y1 = y0 + output_shape[1]
                if ndim_data > 2:
                    # 2D net on a 3D volume: update a single z-slice
                    prev_update_dist = prob_map_update_dist[z0, x0:x1, y0:y1]
                    prev_prob = prob_maps[:, z0, x0:x1, y0:y1]
                    parts_to_update = prev_update_dist < patch_dist
                    prev_prob[:, parts_to_update] = \
                        patch_prob[:, parts_to_update]
                    prob_maps[:, z0, x0:x1, y0:y1] = prev_prob
                    prev_update_dist[parts_to_update] = \
                        patch_dist[parts_to_update]
                    prob_map_update_dist[z0, x0:x1, y0:y1] = prev_update_dist
                else:
                    prev_update_dist = prob_map_update_dist[x0:x1, y0:y1]
                    prev_prob = prob_maps[:, x0:x1, y0:y1]
                    parts_to_update = prev_update_dist < patch_dist
                    prev_prob[:, parts_to_update] = \
                        patch_prob[:, parts_to_update]
                    prob_maps[:, x0:x1, y0:y1] = prev_prob
                    prev_update_dist[parts_to_update] = \
                        patch_dist[parts_to_update]
                    prob_map_update_dist[x0:x1, y0:y1] = prev_update_dist

        all_prob_maps.append(prob_maps)

    # Ensemble: average the per-net probability maps, then argmax per voxel
    prob_map_mean = np.mean(all_prob_maps, axis=0)
    segmentation = np.argmax(prob_map_mean, axis=0)

    def tif_cmap(c):
        """Convert a matplotlib colormap into a tifffile colormap. """
        a = plt.get_cmap(c)(np.arange(256))
        return np.swapaxes(255 * a, 0, 1)[0:3, :].astype('u1')

    # Save a bunch of images, if `save_dir` was supplied
    if save_dir is not None:
        # Create a data volume image
        # For multichannel 3D data, only use the first channel, under the
        # assumption that that is actual image data
        # TODO: Find a more robust solution for multichannel data
        if ndim_data == 4:
            data_vol = data_vol[0, ...]
        # Generate a file name and path (fixed: was a placeholder-less
        # f-string)
        data_fname = 'train-data.tif'
        data_fpath = os.path.join(save_dir, data_fname)
        # Create a colormap compatible with tifffile's save function
        data_tcmap = tif_cmap(image_cmaps['data'])
        # Rescale the data volume to the full uint8 range
        data_image = (255. * (data_vol - data_vol.min())
                      / (data_vol.max() - data_vol.min())).astype(np.uint8)
        tif.imsave(data_fpath, data_image, colormap=data_tcmap)

        # Create a segmentation volume image
        seg_fname = f'segmentation_{save_name}.tif'
        seg_fpath = os.path.join(save_dir, seg_fname)
        seg_tcmap = tif_cmap(image_cmaps['segmentation'])
        # Spread class labels across the uint8 range for display
        seg_image = (255. / (data_handler.n_classes - 1)
                     * segmentation).astype(np.uint8)
        tif.imsave(seg_fpath, seg_image, colormap=seg_tcmap, compress=7)

    return segmentation
def segment(net_sources: Union[gn.GeneNet, str, List[str]],
            image_source: Union[np.ndarray, str],
            output_dir: Optional[str] = None,
            label_source: Optional[Union[np.ndarray, str]] = None,
            device: Optional[str] = None) -> Tuple[np.ndarray, np.ndarray]:
    """Segment an image with one or more networks, ensembling the results.

    Args:
        net_sources (Union[gn.GeneNet, str, List[str]]): A GeneNet or one or
            more paths to directories containing saved model files. If more
            than one source is supplied, the resulting segmentation is an
            ensemble of the outputs from each source.
        image_source (Union[np.ndarray, str]): Either an image as a numpy
            array, or a path to a saved image. This image is segmented by
            the net(s).
        output_dir (Optional[str]): Directory for saving the output of the
            segmentation process, if supplied.
        label_source (Optional[Union[np.ndarray, str]]): Optional label
            volume (or path to one); must be the same type as
            `image_source` when supplied. Passed through to the
            DataHandler.
        device (Optional[str]): Device specifier forwarded to checkpoint
            restoration.

    Returns:
        segmentation (np.ndarray): Segmentation of `image_source`'s image.
            Has the same shape as the image.
        prob_maps (np.ndarray): Per-voxel probability maps for each class
            across the input image. `prob_maps[i, ...]` is the per-voxel
            probability map for class `i`, and has the same shape as the
            input image.

    Raises:
        TypeError: If `label_source` is supplied with a different type from
            `image_source`.

    """
    if isinstance(net_sources, (str, gn.GeneNet)):
        net_sources = [net_sources]
    # Fixed: `if label_source` raised "truth value of an array is
    # ambiguous" for ndarray inputs; compare against None explicitly
    if label_source is not None and type(image_source) != type(label_source):
        raise TypeError('label_source must have same type as image_source if'
                        ' supplied')
    if isinstance(image_source, str):
        eval_dir = os.path.dirname(image_source)
        image_file = os.path.basename(image_source)
        if label_source is not None:
            label_rel_name = os.path.relpath(label_source, eval_dir)
        else:
            label_rel_name = None
    else:
        eval_dir = None
        image_file = image_source
        # Fixed: label_rel_name was left unbound (NameError below) when an
        # array image was supplied without labels
        label_rel_name = label_source

    data_handler = gn.DataHandler(eval_data_dir=eval_dir,
                                  eval_file=image_file,
                                  eval_label_file=label_rel_name)
    data_vol = data_handler.eval_volume
    image_cmaps = {'data': 'gray', 'segmentation': 'jet', 'prob_maps': 'pink'}
    save_name = 'prediction.tif'
    ndim_data = data_vol.ndim

    all_prob_maps = []
    for source in net_sources:
        # Restore a net from disk, or use an already-constructed GeneNet
        if isinstance(source, str):
            ckpt_dir = os.path.join(source, 'model', 'checkpoints', 'best')
            net = lab.restore_from_checkpoint(source, ckpt_dir, device)
        else:
            net = source
        print(f'Net input shape: {net.gene_graph.input_shape}. '
              f'Net output shape: {net.gene_graph.output_shape()}')
        output_shape = net.gene_graph.output_shape()
        net_is_3d = len(output_shape) == 3

        # Shape of the segmentation volume is same as data volume if
        # single-channel, else ignore the channel dimension
        if ndim_data > 3:
            vol_shape = data_vol.shape[1:]
        else:
            vol_shape = data_vol.shape

        # Shape of the probability map volume: one map per class
        prob_shape = [data_handler.n_classes] + list(vol_shape)
        prob_maps = np.zeros(prob_shape)
        # Fixed: `np.int` alias was removed in NumPy 1.24; builtin `int` is
        # the documented replacement
        prob_map_update_dist = np.zeros(vol_shape, dtype=int)

        # Check if SAME padding is used; if so, overlap forward windows so
        # window seams can be blended
        gene0 = list(net.gene_graph.genes.items())[0][1]
        padding = gene0.hyperparam('padding_type')
        is_same_padded = padding.lower() == 'same'
        if is_same_padded:
            forward_window_overlap = [1] * (3 - len(output_shape)) + [
                s // 3 for s in output_shape
            ]
        else:
            forward_window_overlap = [0] * 3

        # Create an input_fn for the inference pass
        predict_input_fn = data_handler.input_fn(
            mode=tf.estimator.ModeKeys.PREDICT,
            graph_source=net,
            forward_window_overlap=forward_window_overlap,
            prediction_volume=data_vol)

        # Inference pass result generator
        results: Iterator[Dict[str, np.ndarray]] = \
            net.predict(predict_input_fn)

        # TODO: pass that distance scale triplet as a parameter instead of
        # hard-coding
        if net_is_3d:
            distance_scale = (4, 1, 1)
        else:
            distance_scale = (1, 1)

        for r in results:
            patch_prob = r['probabilities']
            patch_dist = memoized_distance_transform(patch_prob.shape[1:],
                                                     distance_scale)
            patch_corner = r['corner']
            # Region of the output volume this patch covers
            if net_is_3d:
                z0 = patch_corner[0]
                z1 = z0 + output_shape[0]
                x0 = patch_corner[1]
                x1 = x0 + output_shape[1]
                y0 = patch_corner[2]
                y1 = y0 + output_shape[2]
                region = (slice(z0, z1), slice(x0, x1), slice(y0, y1))
            else:
                z0 = patch_corner[0]
                x0 = patch_corner[1]
                x1 = x0 + output_shape[0]
                y0 = patch_corner[2]
                y1 = y0 + output_shape[1]
                if ndim_data > 2:
                    # NOTE(review): this region has a leading length-1 z
                    # axis while `patch_dist` is 2D — the boolean masks
                    # below rely on broadcasting; verify the 2D-net-on-3D-
                    # volume path against a real run
                    region = (slice(z0, z0 + 1), slice(x0, x1),
                              slice(y0, y1))
                else:
                    region = (slice(x0, x1), slice(y0, y1))

            if is_same_padded:
                # Overwrite only voxels where this patch scores higher than
                # whatever was written before
                parts_to_update = prob_map_update_dist[region] < patch_dist
                # Fixed: `np.bool` alias was removed in NumPy 1.24
                padded_parts_to_update = np.zeros_like(prob_map_update_dist,
                                                       dtype=bool)
                padded_parts_to_update[region] = parts_to_update
                prob_maps[:, padded_parts_to_update] = \
                    patch_prob[:, parts_to_update]
                prob_map_update_dist[padded_parts_to_update] = \
                    patch_dist[parts_to_update]
            else:
                # VALID padding: windows do not overlap, write directly
                if net_is_3d:
                    prob_maps[:, z0:z1, x0:x1, y0:y1] = patch_prob
                else:
                    if ndim_data > 2:
                        prob_maps[:, z0, x0:x1, y0:y1] = patch_prob
                    else:
                        prob_maps[:, x0:x1, y0:y1] = patch_prob

        all_prob_maps.append(prob_maps)

    # Ensemble: average the per-net probability maps, then argmax per voxel
    prob_map_mean = np.mean(all_prob_maps, axis=0)
    segmentation = np.argmax(prob_map_mean, axis=0)

    def tif_cmap(c):
        """Convert a matplotlib colormap into a tifffile colormap. """
        a = plt.get_cmap(c)(np.arange(256))
        return np.swapaxes(255 * a, 0, 1)[0:3, :].astype('u1')

    # Save a bunch of images, if `output_dir` was supplied
    if output_dir is not None:
        # Create a data volume image
        # For multichannel 3D data, only use the first channel, under the
        # assumption that that is actual image data
        # TODO: Find a more robust solution for multichannel data
        if ndim_data == 4:
            data_vol = data_vol[0, ...]
        # Generate a file name and path (fixed: was a placeholder-less
        # f-string)
        data_fname = 'train-data.tif'
        data_fpath = os.path.join(output_dir, data_fname)
        # Create a colormap compatible with tifffile's save function
        data_tcmap = tif_cmap(image_cmaps['data'])
        # Rescale the data volume to the full uint8 range
        data_image = (255. * (data_vol - data_vol.min())
                      / (data_vol.max() - data_vol.min())).astype(np.uint8)
        tif.imsave(data_fpath, data_image, colormap=data_tcmap)

        # Create a segmentation volume image
        seg_fname = save_name
        seg_fpath = os.path.join(output_dir, seg_fname)
        seg_tcmap = tif_cmap(image_cmaps['segmentation'])
        # Spread class labels across the uint8 range for display
        seg_image = (255. / (data_handler.n_classes - 1)
                     * segmentation).astype(np.uint8)
        tif.imsave(seg_fpath, seg_image, colormap=seg_tcmap, compress=7)

    return segmentation, prob_map_mean
def evaluate(net_dir: str,
             image_file: str,
             label_file: Optional[str] = None,
             checkpoint_dir: Optional[str] = None,
             segmentation_out_tif: Optional[str] = None,
             eval_out_json: Optional[str] = None,
             save_prob_maps: bool = False,
             device: Optional[str] = None) -> Dict[str, Union[float, str]]:
    """Restore a saved network and run an evaluation pass on an image.

    Optionally writes the eval metrics to JSON and a segmentation image to
    TIF.

    Args:
        net_dir (str): Directory containing the saved network.
        image_file (str): Path to the image volume to evaluate on.
        label_file (Optional[str]): Path to the corresponding label volume.
            When None, the DataHandler is built without labels.
        checkpoint_dir (Optional[str]): Checkpoint directory passed to
            `restore_from_checkpoint`.
        segmentation_out_tif (Optional[str]): If supplied, a segmentation
            image is saved with this path's directory and base name.
        eval_out_json (Optional[str]): If supplied, eval results are
            JSON-serialized to this path.
        save_prob_maps (bool): Whether probability-map images are also
            drawn when saving the segmentation.
        device (Optional[str]): Device specifier forwarded to checkpoint
            restoration.

    Returns:
        Dict[str, Union[float, str]]: Eval results produced by
        `net.evaluate`.

    """
    do_eval = label_file is not None
    save_image = segmentation_out_tif is not None
    save_eval = eval_out_json is not None

    # Make sure the JSON output directory exists before the (potentially
    # long) eval pass runs. (Renamed from `eval_dir`, which was previously
    # reused for the image directory below.)
    if save_eval:
        json_dir = os.path.dirname(eval_out_json)
        if json_dir != '':
            os.makedirs(json_dir, exist_ok=True)

    net = restore_from_checkpoint(net_dir, checkpoint_dir, device=device)

    # Build a DataHandler around the eval image (and label, if given)
    eval_dir = os.path.dirname(image_file)
    image_name = os.path.basename(image_file)
    if do_eval:
        label_rel_name = os.path.relpath(label_file, eval_dir)
        data_handler = gn.DataHandler(eval_data_dir=eval_dir,
                                      eval_file=image_name,
                                      eval_label_file=label_rel_name)
    else:
        data_handler = gn.DataHandler(eval_data_dir=eval_dir,
                                      eval_file=image_name)

    eval_input_fn = data_handler.input_fn(mode=tf.estimator.ModeKeys.EVAL,
                                          graph_source=net.gene_graph)
    eval_results = net.evaluate(eval_input_fn)

    if save_eval:
        with open(eval_out_json, 'w') as fd:
            json.dump(eval_results, fd)

    if save_image:
        # Segmentation coloration info
        image_cmaps = {
            'data': 'gray',
            'segmentation': 'jet',
            'prob_maps': 'pink'
        }
        media_dir = os.path.dirname(segmentation_out_tif)
        # Fixed: guard against a bare file name — makedirs('') raises
        # FileNotFoundError (matches the JSON branch above)
        if media_dir != '':
            os.makedirs(media_dir, exist_ok=True)
        tif_name = os.path.splitext(
            os.path.basename(segmentation_out_tif))[0]
        gn.segment(net,
                   data_handler=data_handler,
                   data_vol=data_handler.eval_volume,
                   label_vol=data_handler.eval_label_volume,
                   save_dir=media_dir,
                   image_cmaps=image_cmaps,
                   save_name=tif_name,
                   draw_prob_maps=save_prob_maps)

    return eval_results