| 1 | +#!/usr/bin/env python |
1 | 2 | # |
2 | 3 | # Scene Detection with Python and OpenCV - Example Program |
3 | 4 | # Part 2: Adaptive Fade Detection By: Brandon Castellano |
4 | 5 | # |
5 | 6 | # http://www.bcastell.com/tech-articles/pyscenedetect-tutorial-part-2/ |
6 | 7 | # |
7 | | -# This Python program implements a more advanced and optimized threshold- |
8 | | -# based scene detection algorithm, and improves the output format so |
9 | | -# the scene cuts can be more easily imported into other programs (e.g. |
10 | | -# ffmpeg, mkvmerge). Basic usage is: |
| 8 | +# This Python program implements an optimized, threshold-based |
| 9 | +# scene detection algorithm, and improves the output format so that |
| 10 | +# scene cuts can be more easily imported into other programs (e.g. |
| 11 | +# ffmpeg, mkvmerge). Usage: |
11 | 12 | # |
12 | | -# > python part2-adaptive.py [-h] -i VIDEO_FILE |
| 13 | +# > python part2-adaptive.py VIDEO_FILE [intensity = 16] |
13 | 14 | # |
14 | | -# Where -i denotes the input video, and -h shows the help message. |
15 | | -# Optional arguments that can be passed after VIDEO_FILE are: |
16 | | -# |
17 | | -# -h, --help show this help message and exit |
18 | | -# -i VIDEO_FILE, --input VIDEO_FILE |
19 | | -# [REQUIRED] Path to input video. (default: None) |
20 | | -# -t intensity, --threshold intensity |
21 | | -# 8-bit intensity value, from 0-255, to use as a fade |
22 | | -# in/out detection threshold. (default: 8) |
23 | | -# -m percent, --minpercent percent |
24 | | -# Amount of pixels in a frame, from 0-100%, that must |
25 | | -# fall under [intensity]. (default: 95) |
26 | | -# -b rows, --blocksize rows |
27 | | -# Number of rows in frame to check at once, can be tuned |
28 | | -# for performance. (default: 32) |
29 | | -# -s offset, --startindex offset |
30 | | -# Starting index for chapter/scene output. (default: 0) |
31 | | -# |
32 | | -# Example: |
33 | | -# > python part2-adaptive.py -i testvideo.mp4 |
34 | | -# > python part2-adaptive.py -i testvideo.mp4 -t 8 -m 95 -b 32 -s 0 |
| 15 | +# This prints a list of the fades/cuts detected in VIDEO_FILE and their |
| 16 | +# timecodes, using [intensity] as the detection threshold. Other |
| 17 | +# parameters (e.g. minimum match percent and block size) can be |
| 18 | +# modified just above the main function in the source below. |
35 | 19 | # |
36 | 20 | # For each fade/cut that is detected, the timecodes and frame numbers |
37 | 21 | # are printed to stdout. Note that this program depends on the Python |
49 | 33 | # OTHER DEALINGS IN THE SOFTWARE. |
50 | 34 | # |
51 | 35 |
52 | | - |
53 | 36 | import sys |
54 | | -import argparse |
55 | | - |
56 | 37 | import cv2 |
57 | 38 | import numpy as np |
58 | 39 |
59 | 40 |
60 | | -def int_type_check(min_val, max_val = None, metavar = None): |
61 | | - if metavar == None: metavar = 'value' |
62 | | - def _type_check(value): |
63 | | - value = int(value) |
64 | | - valid = True |
65 | | - msg = '' |
66 | | - if (max_val == None): |
67 | | - if (value < min_val): valid = False |
68 | | - msg = 'invalid choice: %d (%s must be at least %d)' % ( |
69 | | - value, metavar, min_val ) |
70 | | - else: |
71 | | - if (value < min_val or value > max_val): valid = False |
72 | | - msg = 'invalid choice: %d (%s must be between %d and %d)' % ( |
73 | | - value, metavar, min_val, max_val ) |
74 | | - if not valid: |
75 | | - raise argparse.ArgumentTypeError(msg) |
76 | | - return value |
77 | | - return _type_check |
78 | | - |
79 | | - |
80 | | -def get_cli_parser(): |
81 | | - parser = argparse.ArgumentParser( |
82 | | - formatter_class = argparse.ArgumentDefaultsHelpFormatter) |
83 | | - parser._optionals.title = 'arguments' |
84 | | - |
85 | | - parser.add_argument('-i', '--input', metavar = 'VIDEO_FILE', |
86 | | - type = file, required = True, |
87 | | - help = '[REQUIRED] Path to input video.') |
88 | | - parser.add_argument('-t', '--threshold', metavar = 'intensity', |
89 | | - type = int_type_check(0, 255, 'intensity'), default = 8, |
90 | | - help = '8-bit intensity value, from 0-255, to use as a fade in/out detection threshold.') |
91 | | - parser.add_argument('-m', '--minpercent', metavar = 'percent', |
92 | | - type = int_type_check(0, 100, 'percentage'), default = 95, |
93 | | - help = 'Amount of pixels in a frame, from 0-100%%, that must fall under [intensity].') |
94 | | - parser.add_argument('-b', '--blocksize', metavar = 'rows', |
95 | | - type = int_type_check(0, None, 'number of rows'), default = 32, |
96 | | - help = 'Number of rows in frame to check at once, can be tuned for performance.') |
97 | | - parser.add_argument('-s', '--startindex', metavar = 'offset', |
98 | | - type = int, default = 0, |
99 | | - help = 'Starting index for chapter/scene output.') |
100 | | - |
101 | | - return parser |
| 41 | +# Advanced Scene Detection Parameters |
| 42 | +INTENSITY_THRESHOLD = 16 # Pixel intensity threshold (0-255), default 16 |
| 43 | +MINIMUM_PERCENT = 95 # Min. amount of pixels to be below threshold. |
| 44 | +BLOCK_SIZE = 32 # Num. of rows to sum per iteration. |
102 | 45 |
103 | 46 |
104 | 47 | def main(): |
105 | | - args = get_cli_parser().parse_args() |
| 48 | + if len(sys.argv) < 2: |
| 49 | + print "Error - file name must be specified as first argument." |
| 50 | + return |
| 51 | + |
| 52 | + cap = cv2.VideoCapture() |
| 53 | + cap.open(sys.argv[1]) |
| 54 | + |
| 55 | + if not cap.isOpened(): |
| 56 | + print "Fatal error - could not open video %s." % sys.argv[1] |
| 57 | + return |
| 58 | + else: |
| 59 | + print "Parsing video %s..." % sys.argv[1] |
| 60 | + |
| 61 | + # Video opened successfully; query its properties before detection. |
106 | 62 |
107 | | - print args |
| 63 | + width = cap.get(cv2.cv.CV_CAP_PROP_FRAME_WIDTH) |
| 64 | + height = cap.get(cv2.cv.CV_CAP_PROP_FRAME_HEIGHT) |
| 65 | + print "Video Resolution: %d x %d" % (width, height) |
| 66 | + |
| 67 | + # Allow the threshold to be passed as an optional, second argument to the script. |
| 68 | + threshold = INTENSITY_THRESHOLD |
| 69 | + if len(sys.argv) > 2 and int(sys.argv[2]) > 0: |
| 70 | + threshold = int(sys.argv[2]) |
| 71 | + print "Detecting scenes with threshold = %d" % threshold |
| 72 | + print "Min. pixels under threshold = %d %%" % MINIMUM_PERCENT |
| 73 | + print "Block/row size = %d" % BLOCK_SIZE |
| 74 | + print "" |
| 75 | + |
| 76 | + min_percent = MINIMUM_PERCENT / 100.0 |
| 77 | + num_rows = BLOCK_SIZE |
| 78 | + last_amt = 0 # Number of pixel values above threshold in last frame. |
| 79 | + start_time = cv2.getTickCount() # Used for statistics after loop. |
| 80 | + |
| 81 | + while True: |
| 82 | + # Get next frame from video. |
| 83 | + (rv, im) = cap.read() |
| 84 | + if not rv: # im is a valid image if and only if rv is true |
| 85 | + break |
| 86 | + |
| 87 | + # Compute # of pixel values and minimum amount to trigger fade. |
| 88 | + num_pixel_vals = float(im.shape[0] * im.shape[1] * im.shape[2]) |
| 89 | + min_pixels = int(num_pixel_vals * (1.0 - min_percent)) |
| 90 | + |
| 91 | + # Loop through frame block-by-block, updating current sum. |
| 92 | + frame_amt = 0 |
| 93 | + curr_row = 0 |
| 94 | + while curr_row < im.shape[0]: |
| 95 | + # Add # of pixel values in current block above the threshold. |
| 96 | + frame_amt += np.sum( |
| 97 | + im[curr_row : curr_row + num_rows,:,:] > threshold ) |
| 98 | + if frame_amt > min_pixels: # We can avoid checking the rest of the |
| 99 | + break # frame since we crossed the boundary. |
| 100 | + curr_row += num_rows |
| 101 | + |
| 102 | + # Detect fade in from black. |
| 103 | + if frame_amt >= min_pixels and last_amt < min_pixels: |
| 104 | + print "Detected fade in at %dms (frame %d)." % ( |
| 105 | + cap.get(cv2.cv.CV_CAP_PROP_POS_MSEC), |
| 106 | + cap.get(cv2.cv.CV_CAP_PROP_POS_FRAMES) ) |
| 107 | + |
| 108 | + # Detect fade out to black. |
| 109 | + elif frame_amt < min_pixels and last_amt >= min_pixels: |
| 110 | + print "Detected fade out at %dms (frame %d)." % ( |
| 111 | + cap.get(cv2.cv.CV_CAP_PROP_POS_MSEC), |
| 112 | + cap.get(cv2.cv.CV_CAP_PROP_POS_FRAMES) ) |
| 113 | + |
| 114 | + last_amt = frame_amt # Store current amount to compare in next iteration. |
| 115 | + |
| 116 | + # Get # of frames in video based on the position of the last frame we read. |
| 117 | + frame_count = cap.get(cv2.cv.CV_CAP_PROP_POS_FRAMES) |
| 118 | + # Compute runtime and average framerate |
| 119 | + total_runtime = float(cv2.getTickCount() - start_time) / cv2.getTickFrequency() |
| 120 | + avg_framerate = float(frame_count) / total_runtime |
| 121 | + |
| 122 | + print "Read %d frames from video in %4.2f seconds (avg. %4.1f FPS)." % ( |
| 123 | + frame_count, total_runtime, avg_framerate) |
| 124 | + |
| 125 | + cap.release() |
108 | 126 |
109 | | - pass |
110 | 127 |
111 | | - |
112 | 128 | if __name__ == "__main__": |
113 | 129 | main() |
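
The committed script above targets Python 2 and the OpenCV 2.x bindings (print statements, cv2.cv.CV_CAP_PROP_* constants). As a minimal sketch of the same technique for readers on a current toolchain, the listing below restates the core loop added in this commit: count the pixel values above the intensity threshold block-by-block with an early exit, then report a fade in or fade out whenever that count crosses the minimum-pixel boundary relative to the previous frame. It assumes Python 3 and the OpenCV 3+ property names (cv2.CAP_PROP_POS_MSEC, cv2.CAP_PROP_POS_FRAMES); the detect_fades helper name is illustrative only and is not part of the commit.

    import sys
    import cv2
    import numpy as np

    # Same tunable parameters as the constants declared above main() in the commit.
    INTENSITY_THRESHOLD = 16   # Pixel intensity threshold (0-255).
    MINIMUM_PERCENT = 95       # Percent of pixel values that must fall below the threshold.
    BLOCK_SIZE = 32            # Number of rows summed per iteration.

    def detect_fades(video_path, threshold=INTENSITY_THRESHOLD):
        # Hypothetical helper wrapping the detection loop from the script above.
        cap = cv2.VideoCapture(video_path)
        if not cap.isOpened():
            raise IOError("could not open video %s" % video_path)

        min_percent = MINIMUM_PERCENT / 100.0
        last_amt = 0  # Pixel values above the threshold in the previous frame.
        while True:
            rv, im = cap.read()  # im is a valid frame only when rv is True.
            if not rv:
                break
            # Count of above-threshold values needed for the frame to count as "not black".
            num_pixel_vals = float(im.shape[0] * im.shape[1] * im.shape[2])
            min_pixels = int(num_pixel_vals * (1.0 - min_percent))

            # Sum above-threshold values block-by-block so we can stop early.
            frame_amt, curr_row = 0, 0
            while curr_row < im.shape[0]:
                frame_amt += int(np.sum(im[curr_row:curr_row + BLOCK_SIZE, :, :] > threshold))
                if frame_amt > min_pixels:  # Boundary already crossed; skip the rest of the frame.
                    break
                curr_row += BLOCK_SIZE

            pos_ms = cap.get(cv2.CAP_PROP_POS_MSEC)       # OpenCV 3+ names for the
            pos_frame = cap.get(cv2.CAP_PROP_POS_FRAMES)  # cv2.cv.CV_CAP_PROP_* constants above.
            if frame_amt >= min_pixels and last_amt < min_pixels:
                print("Detected fade in at %dms (frame %d)." % (pos_ms, pos_frame))
            elif frame_amt < min_pixels and last_amt >= min_pixels:
                print("Detected fade out at %dms (frame %d)." % (pos_ms, pos_frame))
            last_amt = frame_amt

        cap.release()

    if __name__ == "__main__":
        detect_fades(sys.argv[1], int(sys.argv[2]) if len(sys.argv) > 2 else INTENSITY_THRESHOLD)

The reported millisecond offsets can then be converted to HH:MM:SS.mmm timecodes before being handed to a splitting or chaptering tool such as ffmpeg or mkvmerge, which is the import path the header comment has in mind.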