Update performance example with all changes this time

sfe-SparkFro · sfe-SparkFro · commit 08a7dbcbd501 · 2025-07-17T13:51:24.000-06:00
diff --git a/examples/ex05_performance.py b/examples/ex05_performance.py
@@ -12,38 +12,63 @@
 import cv2 as cv
 from cv2_hardware_init import *
 
-# Import NumPy
+# Import NumPy to create arrays
 from ulab import numpy as np
 
 # Import time for frame rate calculation
 import time
 
-# Initialize a loop timer to calculate processing speed in FPS
-loop_time = time.ticks_us()
+# Import garbage collector to measure memory usage
+import gc
+
+# Many OpenCV functions can take an optional output argument to store the result
+# of the operation. If it's not provided, OpenCV allocates a new array to store
+# the result, which can be slow and waste memory. When it is provided, OpenCV
+# instead writes the result to the provided array, reducing memory usage and
+# improving performance. The array must have the same shape and data type as the
+# expected output of the operation, otherwise a new array will be allocated.
+# 
+# Here we preallocate arrays for the destination arguments of this example. If
+# the shapes or data types are incorrect, OpenCV will simply allocate new arrays
+# for each on the first loop iteration. The variables will then be re-assigned,
+# so this only negatively affects the first loop iteration.
+frame = np.zeros((240, 320, 3), dtype=np.uint8)
+result_image = np.zeros((240, 320, 3), dtype=np.uint8)
 
 # Open the camera
 camera.open()
 
-# The `read()` method of OpenCV camera drivers can optionally take an output
-# image as an argument. When it's not provided, the camera driver must allocate
-# a whole new image for the frame, which can be slow and waste memory. If the
-# image argument is provided, then the camera driver will write the data to the
-# provided image. The image must be a NumPy array with the same shape and data
-# type as the camera's
-success, frame = camera.read()
+# Initialize a loop timer to calculate processing speed in FPS
+loop_time = time.ticks_us()
+
+# Initialize a variable to track memory usage
+last_mem_free = gc.mem_free()
 
 # Prompt the user to press a key to continue
 print("Press any key to continue")
 
 # Loop to continuously read frames from the camera and display them
 while True:
-    # Read a frame from the camera
-    success, frame = camera.read()
+    # Read a frame from the camera and measure how long it takes. Try running
+    # this both with and without the preallocated `frame` array to see the
+    # difference in performance
+    t0 = time.ticks_us()
+    success, frame = camera.read(frame)
+    t1 = time.ticks_us()
+    print("Read frame: %.2f ms" % ((t1 - t0) / 1_000), end='\t')
+
+    # Check if the frame was read successfully
     if not success:
         print("Failed to read frame from camera")
         break
 
-    # Now we'll 
+    # Now we'll do some processing on the frame. Try running this with and
+    # without the preallocated `result_image` array, and try different OpenCV
+    # functions to compare performance
+    t0 = time.ticks_us()
+    result_image = cv.cvtColor(frame, cv.COLOR_BGR2HSV, result_image)
+    t1 = time.ticks_us()
+    print("Processing: %.2f ms" % ((t1 - t0) / 1_000), end='\t')
 
     # It's a good idea to measure the frame rate of the main loop to see how
     # fast the entire pipeline is running. This will include not only the
@@ -53,10 +78,38 @@
     current_time = time.ticks_us()
     fps = 1_000_000 / (current_time - loop_time)
     loop_time = current_time
-    frame = cv.putText(frame, f"FPS: {fps:.2f}", (10, 30), cv.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)
+    print("FPS: %.2f" % fps, end='\t')
+    result_image = cv.putText(result_image, f"FPS: {fps:.2f}", (10, 30), cv.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2)
 
     # Display the frame
-    cv.imshow(display, frame)
+    cv.imshow(display, result_image)
+
+    # We can also measure memory usage to see how much RAM is being consumed by
+    # this code. If you remove the output arguments from the functions above,
+    # you'll see that the memory consumption increases significantly as new
+    # arrays must be allocated each loop iteration
+    mem_free = gc.mem_free()
+    memory_used = last_mem_free - mem_free
+    last_mem_free = mem_free
+    print("Memory free: %d KiB" % (mem_free // 1024), end='\t')
+    print("Memory consumed: %d KiB" % (memory_used // 1024), end='\n')
+
+    # If the memory usage is negative, it means the garbage collector triggered
+    # and freed some memory. Garbage collection can take some time, so you'll
+    # notice a drop in FPS when it happens, and you may see a stutter in the
+    # video stream on the display. This is another reason to preallocate arrays,
+    # since it mitigates how frequently garbage collection is triggered
+    if memory_used < 0:
+        print("Garbage collection triggered!")
+    
+    # Something to try is triggering the garbage collector manually each loop
+    # iteration to immediately free up memory. Garbage collection can be faster
+    # if less memory has been allocated, so this can help avoid long stutters
+    # from occasional garbage collection. However garbage collection will always
+    # take *some* time, so this will lower the average FPS. You can choose to do
+    # this if you prefer a consistent frame rate, or don't if you prefer maximum
+    # frame rate and are okay with occasional stutters
+    # gc.collect()
 
     # Check for key presses
     key = cv.waitKey(1)