'Process some problems about buffer size in GStreamer'

[prev in list] [next in list] [prev in thread] [next in thread] 

List:       gstreamer-devel
Subject:    Process some problems about buffer size in GStreamer
From:       Hùng_Triệu_Việt_via_gstreamer-devel <gstreamer-
Date:       2023-02-27 17:29:56
Message-ID: CAAG1Y3faU72Jw7sJOkxV7XjvVU5La6GJYS8SzrUnx5YhikFW0w () mail ! gmail ! com
[Download RAW message or body]

Hello guys, I'm new to GStreamer. I have a Python code about object
detection app using PyTorch, OpenCV to draw bounding boxes and GStreamer to
process multiple RTSP links. In this pipeline I'm using a video file to
demo:
filesrc ---> decodebin ---> videorate ---> videoconvert ---> queue --->
autovideosink
I have a problem, when I implement a simple code to save the output image,
the expected image must be an image with a frame cutted from input video
and have bounding boxes on that. Instead of that, I have an image with a
series of frames, like a flow of frames cut from input video with bounding
boxes on it (check this image: https://imgur.com/a/QKr4tN2).
Now I have no idea what to do, can someone give me advice on this?

This is my code:
import gi
gi.require_version('Gst', '1.0')
gi.require_version('GObject', '2.0')
from gi.repository import Gst
import numpy as np
import torch
from PIL import Image
import cv2
import time

Gst.init(None)

src = Gst.ElementFactory.make('filesrc', 'source')
src.set_property('location', 'video/test.mp4')
src.set_property('num-buffers', 9000)
decodebin = Gst.ElementFactory.make('decodebin', 'decoder')
videorate = Gst.ElementFactory.make('videorate', 'rate')
videorate.set_property('max-rate', 1)
videoconvert = Gst.ElementFactory.make('videoconvert', 'converter')
queue = Gst.ElementFactory.make('queue', 'queue')
autovideosink = Gst.ElementFactory.make('autovideosink', 's')

pipeline = Gst.Pipeline.new('new-pipeline')

pipeline.add(src)
pipeline.add(decodebin)
pipeline.add(videorate)
pipeline.add(videoconvert)
pipeline.add(queue)
pipeline.add(autovideosink)

def on_pad_added(element, pad):
    sinkpad = videoconvert.get_static_pad('sink')
    pad.link(sinkpad)

    decodebin.link(videorate)
    videorate.link(videoconvert)
    videoconvert.link(queue)
    queue.link(autovideosink)

    sinkpad = autovideosink.get_static_pad('sink')
    videoconvert.link(queue)

src.link(decodebin)
decodebin.connect('pad-added', on_pad_added)

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
detector = torch.hub.load('ultralytics/yolov5', 'custom', 'yolov5s.pt
').eval().to(device)

fps = 0
prev_time = time.time()

def on_frame_probe(pad, info):
    global fps, prev_time
    buf = info.get_buffer()
    # print(buf.get_size())
    print(f'[{buf.pts / Gst.SECOND:6.2f}]')
    image_tensor = buffer_to_image_tensor(buf, pad.get_current_caps())
    with torch.no_grad():
        detections = detector(image_tensor)
        current_time = time.time()
        fps = 1 / (current_time - prev_time)
        print("FPS: {0:.2f}".format(fps))
        prev_time = current_time
        print(detections)
        objects = (detections.xyxy[0]).tolist()
        img_np = np.array(image_tensor)
        for i in range(len(objects)):
            x_min, y_min, x_max, y_max = int(objects[i][0]),
int(objects[i][1]), int(objects[i][2]), int(objects[i][3])
            cv2.rectangle(img_np, (x_min, y_min), (x_max, y_max),
(255,0,0), 2)
        # Save the output image
        Image.fromarray(img_np[:,:,:3]).save("output.jpg")
    return Gst.PadProbeReturn.OK


def buffer_to_image_tensor(buf, caps):
    global fps
    caps_structure = caps.get_structure(0)
    height, width = caps_structure.get_value('height'),
caps_structure.get_value('width')
    channels = 3
    is_mapped, map_info = buf.map(Gst.MapFlags.READ)
    if is_mapped:
        try:
            image_array = np.frombuffer(map_info.data,
dtype=np.uint8).reshape((640, 1637, channels)).copy()
            image_array.resize((height, width, channels))
            image_array = cv2.cvtColor(image_array, cv2.COLOR_BGR2RGB)
            image_array = cv2.resize(image_array, (1920, 1080))
            return Image.fromarray(image_array) # RGBA -> RGB
        finally:
            buf.unmap(map_info)

pipeline.get_by_name('s').get_static_pad('sink').add_probe(
    Gst.PadProbeType.BUFFER,
    on_frame_probe
)

pipeline.set_state(Gst.State.PLAYING)

while True:
    msg = pipeline.get_bus().timed_pop_filtered(
        Gst.SECOND,
        Gst.MessageType.EOS | Gst.MessageType.ERROR
    )
    if msg:
        text = msg.get_structure().to_string() if msg.get_structure() else
''
        msg_type = Gst.message_type_get_name(msg.type)
        print(f'{msg.src.name}: [{msg_type}] {text}')
        break

pipeline.set_state(Gst.State.NULL)

The input video i got from this youtube link:
https://www.youtube.com/watch?v=MNn9qKG2UFI&list=PLcQZGj9lFR7y5WikozDSrdk6UCtAnM9mB
I appreciate you so much.
-- 
Trân trọng,

Triệu Việt Hùng

[Attachment #3 (text/html)]

<div dir="ltr">Hello guys, I&#39;m new to GStreamer. I have a Python code about \
object detection app using PyTorch, OpenCV to draw bounding boxes and GStreamer to \
process multiple RTSP links. In this pipeline I&#39;m using a video file to \
demo:<div>filesrc ---&gt; decodebin ---&gt; videorate ---&gt; videoconvert ---&gt; \
queue ---&gt; autovideosink<br clear="all"><div>I have a problem, when I implement a \
simple code to save the output image, the expected image must be an image with a \
frame cutted from input video and have bounding boxes on that. Instead of that, I \
have an image with a series of frames, like a flow of frames cut from input video \
with bounding boxes on it (check this image: <a \
href="https://imgur.com/a/QKr4tN2">https://imgur.com/a/QKr4tN2</a>).</div><div>Now I \
have no idea what to do, can someone give me advice on \
this?</div><div><br></div><div>This is my code:</div><div>import \
gi<br>gi.require_version(&#39;Gst&#39;, \
&#39;1.0&#39;)<br>gi.require_version(&#39;GObject&#39;, &#39;2.0&#39;)<br>from \
gi.repository import Gst<br>import numpy as np<br>import torch<br>from PIL import \
Image<br>import cv2<br>import time<br><br>Gst.init(None)<br><br>src = \
Gst.ElementFactory.make(&#39;filesrc&#39;, \
&#39;source&#39;)<br>src.set_property(&#39;location&#39;, \
&#39;video/test.mp4&#39;)<br>src.set_property(&#39;num-buffers&#39;, \
9000)<br>decodebin = Gst.ElementFactory.make(&#39;decodebin&#39;, \
&#39;decoder&#39;)<br>videorate = Gst.ElementFactory.make(&#39;videorate&#39;, \
&#39;rate&#39;)<br>videorate.set_property(&#39;max-rate&#39;, 1)<br>videoconvert = \
Gst.ElementFactory.make(&#39;videoconvert&#39;, &#39;converter&#39;)<br>queue = \
Gst.ElementFactory.make(&#39;queue&#39;, &#39;queue&#39;)<br>autovideosink = \
Gst.ElementFactory.make(&#39;autovideosink&#39;, &#39;s&#39;)<br><br>pipeline = \
Gst.Pipeline.new(&#39;new-pipeline&#39;)<br><br>pipeline.add(src)<br>pipeline.add(deco \
debin)<br>pipeline.add(videorate)<br>pipeline.add(videoconvert)<br>pipeline.add(queue)<br>pipeline.add(autovideosink)<br><br>def \
on_pad_added(element, pad):<br>      sinkpad = \
videoconvert.get_static_pad(&#39;sink&#39;)<br>      pad.link(sinkpad)<br>      <br>  \
decodebin.link(videorate)<br>      videorate.link(videoconvert)<br>      \
videoconvert.link(queue)<br>      queue.link(autovideosink)<br>      <br>      \
sinkpad = autovideosink.get_static_pad(&#39;sink&#39;)<br>      \
videoconvert.link(queue)<br>      \
<br>src.link(decodebin)<br>decodebin.connect(&#39;pad-added&#39;, \
on_pad_added)<br><br>device = torch.device(&#39;cuda&#39; if \
torch.cuda.is_available() else &#39;cpu&#39;)<br>detector = \
torch.hub.load(&#39;ultralytics/yolov5&#39;, &#39;custom&#39;, &#39;<a \
href="http://yolov5s.pt">yolov5s.pt</a>&#39;).eval().to(device)<br><br>fps = \
0<br>prev_time = time.time()<br><br>def on_frame_probe(pad, info):<br>      global \
fps, prev_time<br>      buf = info.get_buffer()<br>      # print(buf.get_size())<br>  \
print(f&#39;[{buf.pts / Gst.SECOND:6.2f}]&#39;)<br>      image_tensor = \
buffer_to_image_tensor(buf, pad.get_current_caps())<br>      with \
torch.no_grad():<br>            detections = detector(image_tensor)<br>            \
current_time = time.time()<br>            fps = 1 / (current_time - prev_time)<br>    \
print(&quot;FPS: {0:.2f}&quot;.format(fps))<br>            prev_time = \
current_time<br>            print(detections)<br>            objects = \
(detections.xyxy[0]).tolist()<br>            img_np = np.array(image_tensor)<br>      \
for i in range(len(objects)):<br>                  x_min, y_min, x_max, y_max = \
int(objects[i][0]), int(objects[i][1]), int(objects[i][2]), int(objects[i][3])<br>    \
cv2.rectangle(img_np, (x_min, y_min), (x_max, y_max), (255,0,0), 2)<br>            # \
Save the output image<br>            \
Image.fromarray(img_np[:,:,:3]).save(&quot;output.jpg&quot;)<br>      return \
Gst.PadProbeReturn.OK<br><br><br>def buffer_to_image_tensor(buf, caps):<br>      \
global fps<br>      caps_structure = caps.get_structure(0)<br>      height, width = \
caps_structure.get_value(&#39;height&#39;), \
caps_structure.get_value(&#39;width&#39;)<br>      channels = 3<br>      is_mapped, \
map_info = buf.map(Gst.MapFlags.READ)<br>      if is_mapped:<br>            try:<br>  \
image_array = np.frombuffer(map_info.data, dtype=np.uint8).reshape((640, 1637, \
channels)).copy()<br>                  image_array.resize((height, width, \
channels))<br>                  image_array = cv2.cvtColor(image_array, \
cv2.COLOR_BGR2RGB)<br>                  image_array = cv2.resize(image_array, (1920, \
1080))<br>                  return Image.fromarray(image_array) # RGBA -&gt; RGB<br>  \
finally:<br>                  \
buf.unmap(map_info)<br><br>pipeline.get_by_name(&#39;s&#39;).get_static_pad(&#39;sink&#39;).add_probe(<br> \
Gst.PadProbeType.BUFFER,<br>      \
on_frame_probe<br>)<br><br>pipeline.set_state(Gst.State.PLAYING)<br><br>while \
True:<br>      msg = pipeline.get_bus().timed_pop_filtered(<br>            \
Gst.SECOND,<br>            Gst.MessageType.EOS | Gst.MessageType.ERROR<br>      )<br> \
if msg:<br>            text = msg.get_structure().to_string() if msg.get_structure() \
else &#39;&#39;<br>            msg_type = Gst.message_type_get_name(msg.type)<br>     \
print(f&#39;{<a href="http://msg.src.name">msg.src.name</a>}: [{msg_type}] \
{text}&#39;)<br>            \
break<br><br>pipeline.set_state(Gst.State.NULL)<br></div><div><br></div><div>The \
input video i got from this youtube link:  <a \
href="https://www.youtube.com/watch?v=MNn9qKG2UFI&amp;list=PLcQZGj9lFR7y5WikozDSrdk6UC \
tAnM9mB">https://www.youtube.com/watch?v=MNn9qKG2UFI&amp;list=PLcQZGj9lFR7y5WikozDSrdk6UCtAnM9mB</a></div><div>I \
appreciate you so much.</div>-- <br><div dir="ltr" class="gmail_signature" \
data-smartmail="gmail_signature"><div dir="ltr"><div>Trân \
trọng,</div><div><br></div>Triệu Việt Hùng</div></div></div></div>



[prev in list] [next in list] [prev in thread] [next in thread]
Configure | About | News | Add a list | Sponsored by KoreLogic