Implementation and debugging of InfoOp(Operator) in `colonoscopy_segmentation.py`

mxochicale commented 10 months ago

🚀 Feature

brudfors commented 10 months ago

# SPDX-FileCopyrightText: Copyright (c) 2022-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import os
from argparse import ArgumentParser

from holoscan.core import Application
from holoscan.operators import (
    AJASourceOp,
    FormatConverterOp,
    HolovizOp,
    InferenceOp,
    SegmentationPostprocessorOp,
    VideoStreamReplayerOp,
)
from holoscan.resources import BlockMemoryPool, CudaStreamPool, MemoryStorageType

class InfoOp(Operator):
    """"""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

    def setup(self, spec: OperatorSpec):
        spec.input("in")
        spec.output("out")

    def compute(self, op_input, op_output, context):
        # Get input message
        in_message = op_input.receive("in")

        # Transpose
        tensor = cp.asarray(in_message.get("")).get()

        # Create output message
        out_message = Entity(context)
        out_message.add(hs.as_tensor(tensor), "")
        op_output.emit(out_message, "out")

class ColonoscopyApp(Application):
    def __init__(self, data, source="replayer"):
        """Initialize the colonoscopy segmentation application

        Parameters
        ----------
        source : {"replayer", "aja"}
            When set to "replayer" (the default), pre-recorded sample video data is
            used as the application input. Otherwise, the video stream from an AJA
            capture card is used.
        """

        super().__init__()

        # set name
        self.name = "Colonoscopy App"

        # Optional parameters affecting the graph created by compose.
        self.source = source

        if data == "none":
            data = os.environ.get("HOLOSCAN_DATA_PATH", "../data")

        self.sample_data_path = data

        self.model_path_map = {
            "ultrasound_seg": os.path.join(self.sample_data_path, "colon.onnx"),
        }

    def compose(self):
        n_channels = 4  # RGBA
        bpp = 4  # bytes per pixel

        cuda_stream_pool = CudaStreamPool(
            self,
            name="cuda_stream",
            dev_id=0,
            stream_flags=0,
            stream_priority=0,
            reserved_size=1,
            max_size=5,
        )

        is_aja = self.source.lower() == "aja"
        if is_aja:
            source = AJASourceOp(self, name="aja", **self.kwargs("aja"))
            drop_alpha_block_size = 1920 * 1080 * n_channels * bpp
            drop_alpha_num_blocks = 2
            drop_alpha_channel = FormatConverterOp(
                self,
                name="drop_alpha_channel",
                pool=BlockMemoryPool(
                    self,
                    storage_type=MemoryStorageType.DEVICE,
                    block_size=drop_alpha_block_size,
                    num_blocks=drop_alpha_num_blocks,
                ),
                cuda_stream_pool=cuda_stream_pool,
                **self.kwargs("drop_alpha_channel"),
            )
        else:
            video_dir = os.path.join(self.sample_data_path)
            if not os.path.exists(video_dir):
                raise ValueError(f"Could not find video data: {video_dir=}")
            source = VideoStreamReplayerOp(
                self, name="replayer", directory=video_dir, **self.kwargs("replayer")
            )

        width_preprocessor = 1350
        height_preprocessor = 1072
        preprocessor_block_size = width_preprocessor * height_preprocessor * n_channels * bpp
        preprocessor_num_blocks = 2
        segmentation_preprocessor = FormatConverterOp(
            self,
            name="segmentation_preprocessor",
            pool=BlockMemoryPool(
                self,
                storage_type=MemoryStorageType.DEVICE,
                block_size=preprocessor_block_size,
                num_blocks=preprocessor_num_blocks,
            ),
            cuda_stream_pool=cuda_stream_pool,
            **self.kwargs("segmentation_preprocessor"),
        )

        n_channels_inference = 2
        width_inference = 512
        height_inference = 512
        bpp_inference = 4
        inference_block_size = (
            width_inference * height_inference * n_channels_inference * bpp_inference
        )
        inference_num_blocks = 2
        segmentation_inference = InferenceOp(
            self,
            name="segmentation_inference_holoinfer",
            backend="trt",
            allocator=BlockMemoryPool(
                self,
                storage_type=MemoryStorageType.DEVICE,
                block_size=inference_block_size,
                num_blocks=inference_num_blocks,
            ),
            model_path_map=self.model_path_map,
            pre_processor_map={"ultrasound_seg": ["source_video"]},
            inference_map={"ultrasound_seg": "inference_output_tensor"},
            in_tensor_names=["source_video"],
            out_tensor_names=["inference_output_tensor"],
            enable_fp16=False,
            input_on_cuda=True,
            output_on_cuda=True,
            transmit_on_cuda=True,
        )

        info_op = InfoOp(
            self,
            name="info",
            pool=UnboundedAllocator(self, name="pool"),
        )

        postprocessor_block_size = width_inference * height_inference
        postprocessor_num_blocks = 2
        segmentation_postprocessor = SegmentationPostprocessorOp(
            self,
            name="segmentation_postprocessor",
            allocator=BlockMemoryPool(
                self,
                storage_type=MemoryStorageType.DEVICE,
                block_size=postprocessor_block_size,
                num_blocks=postprocessor_num_blocks,
            ),
            **self.kwargs("segmentation_postprocessor"),
        )

        segmentation_visualizer = HolovizOp(
            self,
            name="segmentation_visualizer",
            cuda_stream_pool=cuda_stream_pool,
            **self.kwargs("segmentation_visualizer"),
        )

        if is_aja:
            self.add_flow(source, segmentation_visualizer, {("video_buffer_output", "receivers")})
            self.add_flow(source, drop_alpha_channel, {("video_buffer_output", "")})
            self.add_flow(drop_alpha_channel, segmentation_preprocessor)
        else:
            self.add_flow(source, segmentation_visualizer, {("", "receivers")})
            self.add_flow(source, segmentation_preprocessor)
        self.add_flow(segmentation_preprocessor, segmentation_inference, {("", "receivers")})
        self.add_flow(segmentation_inference, info_op, {("transmitter", "in")})
        self.add_flow(info_op, segmentation_postprocessor, {("out", "")})
        self.add_flow(
            segmentation_postprocessor,
            segmentation_visualizer,
            {("", "receivers")},
        )

if __name__ == "__main__":
    # Parse args
    parser = ArgumentParser(description="Colonoscopy segmentation demo application.")
    parser.add_argument(
        "-s",
        "--source",
        choices=["replayer", "aja"],
        default="replayer",
        help=(
            "If 'replayer', replay a prerecorded video. If 'aja' use an AJA "
            "capture card as the source (default: %(default)s)."
        ),
    )
    parser.add_argument(
        "-c",
        "--config",
        default="none",
        help=("Set config path to override the default config file location"),
    )
    parser.add_argument(
        "-d",
        "--data",
        default="none",
        help=("Set the data path"),
    )
    args = parser.parse_args()

    if args.config == "none":
        config_file = os.path.join(os.path.dirname(__file__), "colonoscopy_segmentation.yaml")
    else:
        config_file = args.config

    app = ColonoscopyApp(source=args.source, data=args.data)
    app.config(config_file)
    app.run()

mxochicale commented 10 months ago

frames for basename: "out720x576" ls -la ck*.jpg -rwxrwxrwx 1 mxochicale mxochicale 172630 Oct 29 2019 ck2395w2mb4vu07480otsu6tw.jpg -rwxrwxrwx 1 mxochicale mxochicale 31882 Oct 29 2019 ck2bxiswtxuw80838qkisqjwz.jpg -rwxrwxrwx 1 mxochicale mxochicale 27147 Oct 29 2019 ck2bxknhjvs1x0794iogrq49k.jpg -rwxrwxrwx 1 mxochicale mxochicale 170555 Oct 29 2019 ck2bxlujamu330725szlc2jdu.jpg -rwxrwxrwx 1 mxochicale mxochicale 31749 Oct 29 2019 ck2bxpfgxu2mk0748gsh7xelu.jpg -rwxrwxrwx 1 mxochicale mxochicale 204412 Oct 29 2019 ck2bxqz3evvg20794iiyv5v2m.jpg -rwxrwxrwx 1 mxochicale mxochicale 29281 Oct 29 2019 ck2bxskgxxzfv08386xkqtqdy.jpg -rwxrwxrwx 1 mxochicale mxochicale 37883 Oct 29 2019 ck2bxw18mmz1k0725litqq2mc.jpg -rwxrwxrwx 1 mxochicale mxochicale 166204 Oct 30 2019 ck2da7fwcjfis07218r1rvm95.jpg

mxochicale commented 10 months ago

We might like to try to made use of only one frame to keep debugging

mxochicale commented 10 months ago

Thanks Mikael and Zhehua for your input on this one.

I am closing this one with successful implementation, debugging and documentation of InfoOp(Operator): See few screenshots and logs that might lead to future work:

https://github.com/SciKit-Surgery/cmicHACKS2/tree/main/nvidia-clara-agx/colonoscopy_segmentation#screenshots-of-colonoscopy_segmentationpy

SciKit-Surgery / cmicHACKS2

Implementation and debugging of InfoOp(Operator) in `colonoscopy_segmentation.py` #34

🚀 Feature