#!/usr/bin/env python3
"""Time a VPI Harris-corner detection on a synthetic 1080p frame (Jetson).

The script requests maximum clocks via ``jetson_clocks``, builds a random
BGR image, converts it to U8 and runs the Harris corner detector under the
CUDA backend context, then pulls the detected corners back to host memory
and prints the elapsed time in milliseconds.
"""
import subprocess
import time

import numpy as np
import vpi

# Maximum performance on Jetson.
# An argv list (no shell) avoids shell parsing of the command. The call is
# best-effort: the benchmark still runs if the clocks cannot be raised.
try:
    clocks = subprocess.run(["sudo", "jetson_clocks"], check=False)
except FileNotFoundError:
    print("warning: 'sudo' not found; skipping jetson_clocks")
else:
    if clocks.returncode != 0:
        print(f"warning: jetson_clocks exited with status {clocks.returncode}")

# Synthetic 1080p, 3-channel 8-bit frame. The upper bound of randint is
# exclusive, so pixel values lie in [0, 254].
img = np.random.randint(0, 255, (1080, 1920, 3), dtype=np.uint8)

# perf_counter is monotonic and high-resolution, so the measured interval is
# not affected by system clock adjustments.
start = time.perf_counter()

with vpi.Backend.CUDA:
    frame = vpi.asimage(img, vpi.Format.BGR8).convert(vpi.Format.U8)
    corners, scores = frame.harriscorners()

# This causes GPU→CPU transfer (shows in profiler)
# NOTE(review): presumably this call also waits for the submitted VPI work to
# finish, which is why it is kept inside the timed region; confirm against
# the VPI documentation.
corners_cpu = corners.cpu()

print(f"Time: {(time.perf_counter()-start)*1000:.2f}ms")