Run yolov3_tiny.engine from Python

Hi,

We can run the YOLO engine with the script below without any issue.
Could you give it a try?

import ctypes
import pycuda.autoinit
import pycuda.driver as cuda
import tensorrt as trt
import numpy as np

# Load the DeepStream YOLO custom-implementation library before deserializing
# the engine (presumably this registers the custom layers the engine needs --
# confirm against the DeepStream objectDetector_Yolo sample).
ctypes.CDLL("/opt/nvidia/deepstream/deepstream-5.0/sources/objectDetector_Yolo/nvdsinfer_custom_impl_Yolo/libnvdsinfer_custom_impl_Yolo.so")
TRT_LOGGER = trt.Logger(trt.Logger.VERBOSE)

with open("model_b1_gpu0_fp32.engine", "rb") as f, trt.Runtime(TRT_LOGGER) as runtime:
    engine = runtime.deserialize_cuda_engine(f.read())
    if engine is None:
        # deserialize_cuda_engine reports failure by returning None; fail with
        # a clear message instead of an AttributeError further down.
        raise RuntimeError("Failed to deserialize model_b1_gpu0_fp32.engine")

    # Hold on to the DeviceAllocation objects: PyCUDA frees the device memory
    # as soon as an allocation object is garbage collected, so keeping only
    # the integer address would leave the bindings pointing at freed memory.
    device_buffers = []
    bindings = []
    for binding in engine:
        size = trt.volume(engine.get_binding_shape(binding)) * engine.max_batch_size
        # Size each buffer from the binding's own dtype rather than assuming
        # 4-byte elements for every binding.
        itemsize = np.dtype(trt.nptype(engine.get_binding_dtype(binding))).itemsize
        buffer = cuda.mem_alloc(size * itemsize)
        device_buffers.append(buffer)
        bindings.append(int(buffer))

    stream = cuda.Stream()
    # A single execution context is enough for one inference call.
    context = engine.create_execution_context()
    context.execute_async(bindings=bindings, stream_handle=stream.handle)
    # Wait for the asynchronous inference to finish while the buffers are
    # still alive.
    stream.synchronize()

Thanks.