-
Notifications
You must be signed in to change notification settings - Fork 29
Expand file tree
/
Copy pathclassify-video.py
More file actions
144 lines (115 loc) · 6.38 KB
/
classify-video.py
File metadata and controls
144 lines (115 loc) · 6.38 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
#!/usr/bin/env python
# Classify frames sampled from a video file with an Edge Impulse model (.eim).
import device_patches # Device specific patches for Jetson Nano (needs to be before importing cv2)
try:
    import cv2
except ImportError:
    # OpenCV is an optional system dependency; fail early with install instructions.
    print('Missing OpenCV, install via `pip3 install "opencv-python>=4.5.1.48,<5"`')
    exit(1)
import os
import time
import sys, getopt
from edge_impulse_linux.image import ImageImpulseRunner

# Module-level handle to the model runner (assigned inside main's `with` block).
runner = None

# if you don't want to see a video preview, set this to False
show_camera = True
# A headless Linux session (no $DISPLAY) cannot open an OpenCV preview window.
if (sys.platform == 'linux' and not os.environ.get('DISPLAY')):
    show_camera = False
def help():
    """Print the command line usage string for this script.

    NOTE(review): this shadows the builtin ``help``; kept as-is because
    callers in this file reference it by this name.
    """
    usage = 'python classify-video.py <path_to_model.eim> <path_to_video.mp4>'
    print(usage)
def main(argv):
    """Classify frames sampled from a video file with an Edge Impulse model.

    argv -- command line arguments: <path_to_model.eim> <path_to_video>
            (plus optional -h/--help).

    Frames are sampled by wall-clock time: each iteration seeks the video to
    `elapsed-seconds * 1000` ms, so the file is consumed as if it were a live
    stream. The process exits when the video cannot supply a further frame.
    """
    def _usage():
        # Local usage printer; the module-level `help` shadows the builtin,
        # so this block deliberately does not depend on that name.
        print('python classify-video.py <path_to_model.eim> <path_to_video.mp4>')

    try:
        # getopt long-option names must be listed WITHOUT the leading '--'.
        # The original passed ["--help"], which getopt can never match, so
        # `--help` incorrectly fell into the GetoptError branch (exit code 2)
        # instead of printing usage and exiting cleanly.
        opts, args = getopt.getopt(argv, "h", ["help"])
    except getopt.GetoptError:
        _usage()
        sys.exit(2)

    for opt, arg in opts:
        if opt in ('-h', '--help'):
            _usage()
            sys.exit()

    if len(args) != 2:
        _usage()
        sys.exit(2)

    model = args[0]
    video = args[1]

    # Resolve the model path relative to this script's directory.
    dir_path = os.path.dirname(os.path.realpath(__file__))
    modelfile = os.path.join(dir_path, model)
    print('MODEL: ' + modelfile)

    with ImageImpulseRunner(modelfile) as runner:
        try:
            model_info = runner.init()
            # model_info = runner.init(debug=True, timeout=60) # to get debug print out and set longer timeout
            print('Loaded runner for "' + model_info['project']['owner'] + ' / ' + model_info['project']['name'] + '"')
            labels = model_info['model_parameters']['labels']

            vidcap = cv2.VideoCapture(video)
            sec = 0
            start_time = time.time()

            def getFrame(sec):
                # Seek to the requested timestamp (seconds) and decode one frame.
                vidcap.set(cv2.CAP_PROP_POS_MSEC, sec * 1000)
                hasFrames, image = vidcap.read()
                if hasFrames:
                    return image
                # End of video (or decode failure): report and stop the script.
                print('Failed to load frame', video)
                sys.exit(1)

            img = getFrame(sec)
            while img.size != 0:
                # imread returns images in BGR format, so we need to convert to RGB
                img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)

                # get_features_from_image also takes a crop direction arguments in case you don't have square images
                features, cropped = runner.get_features_from_image(img)

                # the image will be resized and cropped, save a copy of the picture here
                # so you can see what's being passed into the classifier
                cv2.imwrite('debug.jpg', cv2.cvtColor(cropped, cv2.COLOR_RGB2BGR))

                res = runner.classify(features)

                if "classification" in res["result"].keys():
                    # Plain classifier: one score per label, printed on one line.
                    print('Result (%d ms.) ' % (res['timing']['dsp'] + res['timing']['classification']), end='')
                    for label in labels:
                        score = res['result']['classification'][label]
                        print('%s: %.2f\t' % (label, score), end='')
                    print('', flush=True)
                elif "bounding_boxes" in res["result"].keys():
                    # Object detection: report and draw each detection on the cropped frame.
                    print('Found %d bounding boxes (%d ms.)' % (len(res["result"]["bounding_boxes"]), res['timing']['dsp'] + res['timing']['classification']))
                    for bb in res["result"]["bounding_boxes"]:
                        print('\t%s (%.2f): x=%d y=%d w=%d h=%d' % (bb['label'], bb['value'], bb['x'], bb['y'], bb['width'], bb['height']))
                        img = cv2.rectangle(cropped, (bb['x'], bb['y']), (bb['x'] + bb['width'], bb['y'] + bb['height']), (255, 0, 0), 1)
                elif "freeform" in res['result'].keys():
                    # Free-form model output: print each raw output vector.
                    print('Result (%d ms.)' % (res['timing']['dsp'] + res['timing']['classification']))
                    for i in range(0, len(res['result']['freeform'])):
                        print(f' Freeform output {i}:', ", ".join(f"{x:.4f}" for x in res['result']['freeform'][i]))

                # Object tracking output
                if "object_tracking" in res["result"].keys():
                    print('Found %d tracked objects' % (len(res["result"]["object_tracking"])))
                    for obj in res["result"]["object_tracking"]:
                        print('\tID=%s, label=%s, value=%.2f, x=%d, y=%d, w=%d, h=%d' % (
                            obj['object_id'], obj['label'], obj['value'], obj['x'], obj['y'], obj['width'], obj['height']))
                        # Draw bounding box
                        x = obj['x']
                        y = obj['y']
                        w = obj['width']
                        h = obj['height']
                        img = cv2.rectangle(cropped, (x, y), (x + w, y + h), (0, 255, 0), 2)
                        # Draw label and ID above the box (below it when too close to the top edge)
                        label_id_text = f"ID={obj['object_id']}, {obj['label']}"
                        text_x = x
                        text_y = y - 10 if y - 10 > 10 else y + 20
                        img = cv2.putText(img, label_id_text, (text_x, text_y),
                                          cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)

                if "visual_anomaly_grid" in res["result"].keys():
                    # Visual anomaly detection: one cell per anomalous grid region.
                    print('Found %d visual anomalies (%d ms.)' % (len(res["result"]["visual_anomaly_grid"]), res['timing']['dsp'] +
                                                                  res['timing']['classification'] +
                                                                  res['timing']['anomaly']))
                    for grid_cell in res["result"]["visual_anomaly_grid"]:
                        print('\t%s (%.2f): x=%d y=%d w=%d h=%d' % (grid_cell['label'], grid_cell['value'], grid_cell['x'], grid_cell['y'], grid_cell['width'], grid_cell['height']))
                        img = cv2.rectangle(cropped, (grid_cell['x'], grid_cell['y']), (grid_cell['x'] + grid_cell['width'], grid_cell['y'] + grid_cell['height']), (255, 125, 0), 1)

                if (show_camera):
                    cv2.imshow('edgeimpulse', cv2.cvtColor(cropped, cv2.COLOR_RGB2BGR))
                    if cv2.waitKey(1) == ord('q'):
                        break

                # Advance to the frame at the current wall-clock offset.
                sec = time.time() - start_time
                sec = round(sec, 2)
                print("Getting frame at: %.2f sec" % sec)
                img = getFrame(sec)
        finally:
            if (runner):
                runner.stop()
if __name__ == "__main__":
    # Script entry point: pass along CLI arguments (argv[0] is the script name).
    main(sys.argv[1:])