Refactor app.py into separate files
- app.py +12 -177
- config.py +7 -0
- videohash.py +57 -0
- videomatch.py +100 -0
app.py CHANGED

@@ -1,166 +1,23 @@
-import tempfile
-import urllib.request
 import logging
-import os
-import hashlib
-import datetime
 import time

 import pandas
 import gradio as gr
-from moviepy.editor import VideoFileClip

 import seaborn as sns
 import matplotlib.pyplot as plt

-import imagehash
-from PIL import Image
-
 import numpy as np
 import pandas as pd
-
-
-import
-
-
-
-
-
-
-MIN_DISTANCE = 4
-MAX_DISTANCE = 30
-
-video_directory = tempfile.gettempdir()
-
-def move_video_to_tempdir(input_dir, filename):
-    new_filename = os.path.join(video_directory, filename)
-    input_file = os.path.join(input_dir, filename)
-    if not os.path.exists(new_filename):
-        shutil.copyfile(input_file, new_filename)
-        logging.info(f"Copied {input_file} to {new_filename}.")
-    else:
-        logging.info(f"Skipping copying from {input_file} because {new_filename} already exists.")
-    return new_filename
-
-def download_video_from_url(url):
-    """Download video from url or return md5 hash as video name"""
-    filename = filename_from_url(url)
-    if not os.path.exists(filename):
-        with (urllib.request.urlopen(url)) as f, open(filename, 'wb') as fileout:
-            fileout.write(f.read())
-        logging.info(f"Downloaded video from {url} to {filename}.")
-    else:
-        logging.info(f"Skipping downloading from {url} because {filename} already exists.")
-    return filename
-
-def change_ffmpeg_fps(clip, fps=FPS):
-    # Hacking the ffmpeg call based on
-    # https://github.com/Zulko/moviepy/blob/master/moviepy/video/io/ffmpeg_reader.py#L126
-    import subprocess as sp
-
-    cmd = [arg + ",fps=%d" % fps if arg.startswith("scale=") else arg for arg in clip.reader.proc.args]
-    clip.reader.close()
-    clip.reader.proc = sp.Popen(cmd, bufsize=clip.reader.bufsize,
-                                stdout=sp.PIPE, stderr=sp.PIPE, stdin=sp.DEVNULL)
-    clip.fps = clip.reader.fps = fps
-    clip.reader.lastread = clip.reader.read_frame()
-    return clip
-
-def compute_hash(frame, hash_size=16):
-    image = Image.fromarray(np.array(frame))
-    return imagehash.phash(image, hash_size)
-
-def binary_array_to_uint8s(arr):
-    bit_string = ''.join(str(1 * x) for l in arr for x in l)
-    return [int(bit_string[i:i+8], 2) for i in range(0, len(bit_string), 8)]
-
-def compute_hashes(clip, fps=FPS):
-    for index, frame in enumerate(change_ffmpeg_fps(clip, fps).iter_frames()):
-        # Each frame is a triplet of size (height, width, 3) of the video since it is RGB
-        # The hash itself is of size (hash_size, hash_size)
-        # The uint8 version of the hash is of size (hash_size * highfreq_factor,) and represents the hash
-        hashed = np.array(binary_array_to_uint8s(compute_hash(frame).hash), dtype='uint8')
-        yield {"frame": 1+index*fps, "hash": hashed}
-
-def index_hashes_for_video(url, is_file = False):
-    """ Download a video if it is a url, otherwise refer to the file. Secondly index the video
-    using faiss indices and return thi index. """
-    if not is_file:
-        filename = download_video_from_url(url)
-    else:
-        filename = url
-    if os.path.exists(f'{filename}.index'):
-        logging.info(f"Loading indexed hashes from {filename}.index")
-        binary_index = faiss.read_index_binary(f'{filename}.index')
-        logging.info(f"Index {filename}.index has in total {binary_index.ntotal} frames")
-        return binary_index
-
-    download_video_from_url(url)
-
-    hash_vectors = np.array([x['hash'] for x in compute_hashes(VideoFileClip(filename))])
-    logging.info(f"Computed hashes for {hash_vectors.shape} frames.")
-
-    # Initializing the quantizer.
-    quantizer = faiss.IndexBinaryFlat(hash_vectors.shape[1]*8)
-    # Initializing index.
-    index = faiss.IndexBinaryIVF(quantizer, hash_vectors.shape[1]*8, min(16, hash_vectors.shape[0]))
-    index.nprobe = 1 # Number of nearest clusters to be searched per query.
-    # Training the quantizer.
-    index.train(hash_vectors)
-    #index = faiss.IndexBinaryFlat(64)
-    index.add(hash_vectors)
-    faiss.write_index_binary(index, f'{filename}.index')
-    logging.info(f"Indexed hashes for {index.ntotal} frames to {filename}.index.")
-    return index
-
-def get_video_indices(url, target, MIN_DISTANCE = 4):
-    """" The comparison between the target and the original video will be plotted based
-    on the matches between the target and the original video over time. The matches are determined
-    based on the minimum distance between hashes (as computed by faiss-vectors) before they're considered a match.
-
-    args:
-    - url: url of the source video (short video which you want to be checked)
-    - target: url of the target video (longer video which is a superset of the source video)
-    - MIN_DISTANCE: integer representing the minimum distance between hashes on bit-level before its considered a match
-    """
-    # TODO: Fix crash if no matches are found
-    is_file = False
-    if url.endswith('.mp4'):
-        is_file = True
-
-    # Url (short video)
-    video_index = index_hashes_for_video(url, is_file)
-    video_index.make_direct_map() # Make sure the index is indexable
-    hash_vectors = np.array([video_index.reconstruct(i) for i in range(video_index.ntotal)]) # Retrieve original indices
-
-    # Target video (long video)
-    target_indices = [index_hashes_for_video(x) for x in [target]]
-
-    return video_index, hash_vectors, target_indices
-
-def compare_videos(video_index, hash_vectors, target_indices, MIN_DISTANCE = 3): # , is_file = False):
-    """ Search for matches between the indices of the target video (long video)
-    and the given hash vectors of a video"""
-    # The results are returned as a triplet of 1D arrays
-    # lims, D, I, where result for query i is in I[lims[i]:lims[i+1]]
-    # (indices of neighbors), D[lims[i]:lims[i+1]] (distances).
-    lims, D, I = target_indices[0].range_search(hash_vectors, MIN_DISTANCE)
-    return lims, D, I, hash_vectors
-
-def get_decent_distance(url, target, MIN_DISTANCE, MAX_DISTANCE):
-    """ To get a decent heurstic for a base distance check every distance from MIN_DISTANCE to MAX_DISTANCE
-    until the number of matches found is equal to or higher than the number of frames in the source video"""
-    for distance in np.arange(start = MIN_DISTANCE - 2, stop = MAX_DISTANCE + 2, step = 2, dtype=int):
-        distance = int(distance)
-        video_index, hash_vectors, target_indices = get_video_indices(url, target, MIN_DISTANCE = distance)
-        lims, D, I, hash_vectors = compare_videos(video_index, hash_vectors, target_indices, MIN_DISTANCE = distance)
-        nr_source_frames = video_index.ntotal
-        nr_matches = len(D)
-        logging.info(f"{(nr_matches/nr_source_frames) * 100.0:.1f}% of frames have a match for distance '{distance}' ({nr_matches} matches for {nr_source_frames} frames)")
-        if nr_matches >= nr_source_frames:
-            return distance
-    logging.warning(f"No matches found for any distance between {MIN_DISTANCE} and {MAX_DISTANCE}")
-    return None
+
+from config import *
+from videomatch import index_hashes_for_video, get_decent_distance, \
+                        get_video_indices, compare_videos, get_change_points
+
+
+logging.basicConfig()
+logging.getLogger().setLevel(logging.INFO)
+

 def plot_comparison(lims, D, I, hash_vectors, MIN_DISTANCE = 3):
     sns.set_theme()

@@ -193,9 +50,6 @@ def plot_comparison(lims, D, I, hash_vectors, MIN_DISTANCE = 3):
     plt.subplots_adjust(bottom=0.25, left=0.20)
     return fig

-logging.basicConfig()
-logging.getLogger().setLevel(logging.INFO)
-
 def plot_multi_comparison(df, change_points):
     """ From the dataframe plot the current set of plots, where the bottom right is most indicative """
     fig, ax_arr = plt.subplots(3, 2, figsize=(12, 6), dpi=100, sharex=True)

@@ -218,7 +72,7 @@ def plot_multi_comparison(df, change_points):
 def get_videomatch_df(url, target, min_distance=MIN_DISTANCE, vanilla_df=False):
     distance = get_decent_distance(url, target, MIN_DISTANCE, MAX_DISTANCE)
     video_index, hash_vectors, target_indices = get_video_indices(url, target, MIN_DISTANCE = distance)
-    lims, D, I, hash_vectors = compare_videos(video_index, hash_vectors, target_indices, MIN_DISTANCE = distance)
+    lims, D, I, hash_vectors = compare_videos(hash_vectors, target_indices, MIN_DISTANCE = distance)

     target = [(lims[i+1]-lims[i]) * [i] for i in range(hash_vectors.shape[0])]
     target_s = [i/FPS for j in target for i in j]

@@ -272,26 +126,10 @@ def get_videomatch_df(url, target, min_distance=MIN_DISTANCE, vanilla_df=False):
     df['time'] = pd.to_datetime(df["TARGET_S"], unit='s') # Needs a datetime as input
     return df

-def get_change_points(df, smoothing_window_size=10, method='CUSUM'):
-    tsd = TimeSeriesData(df.loc[:,['time','OFFSET_LIP']])
-    if method.upper() == "CUSUM":
-        detector = CUSUMDetector(tsd)
-    elif method.upper() == "ROBUST":
-        detector = RobustStatDetector(tsd)
-    change_points = detector.detector(smoothing_window_size=smoothing_window_size, comparison_window=-2)
-
-    # Print some stats
-    if method.upper() == "CUSUM" and change_points != []:
-        mean_offset_prechange = change_points[0].mu0
-        mean_offset_postchange = change_points[0].mu1
-        jump_s = mean_offset_postchange - mean_offset_prechange
-        print(f"Video jumps {jump_s:.1f}s in time at {mean_offset_prechange:.1f} seconds")
-    return change_points
-
 def get_comparison(url, target, MIN_DISTANCE = 4):
     """ Function for Gradio to combine all helper functions"""
     video_index, hash_vectors, target_indices = get_video_indices(url, target, MIN_DISTANCE = MIN_DISTANCE)
-    lims, D, I, hash_vectors = compare_videos(video_index, hash_vectors, target_indices, MIN_DISTANCE = MIN_DISTANCE)
+    lims, D, I, hash_vectors = compare_videos(hash_vectors, target_indices, MIN_DISTANCE = MIN_DISTANCE)
     fig = plot_comparison(lims, D, I, hash_vectors, MIN_DISTANCE = MIN_DISTANCE)
     return fig

@@ -301,7 +139,7 @@ def get_auto_comparison(url, target, smoothing_window_size=10, method="CUSUM"):
     if distance == None:
         raise gr.Error("No matches found!")
     video_index, hash_vectors, target_indices = get_video_indices(url, target, MIN_DISTANCE = distance)
-    lims, D, I, hash_vectors = compare_videos(video_index, hash_vectors, target_indices, MIN_DISTANCE = distance)
+    lims, D, I, hash_vectors = compare_videos(hash_vectors, target_indices, MIN_DISTANCE = distance)
     # fig = plot_comparison(lims, D, I, hash_vectors, MIN_DISTANCE = distance)
     df = get_videomatch_df(url, target, min_distance=MIN_DISTANCE, vanilla_df=False)
     change_points = get_change_points(df, smoothing_window_size=smoothing_window_size, method=method)

@@ -337,8 +175,5 @@ if __name__ == "__main__":
     import matplotlib
     matplotlib.use('SVG') # To be able to plot in gradio

-    logging.basicConfig()
-    logging.getLogger().setLevel(logging.INFO)
-
     iface.launch(inbrowser=True, debug=True)
     #iface.launch(auth=("test", "test"), share=True, debug=True)
config.py ADDED

@@ -0,0 +1,7 @@
+import tempfile
+
+VIDEO_DIRECTORY = tempfile.gettempdir()
+
+FPS = 5
+MIN_DISTANCE = 4
+MAX_DISTANCE = 30
videohash.py ADDED

@@ -0,0 +1,57 @@
+import os
+import urllib.request
+import logging
+import hashlib
+
+from PIL import Image
+import imagehash
+from moviepy.editor import VideoFileClip
+import numpy as np
+
+from config import FPS, VIDEO_DIRECTORY
+
+
+def filepath_from_url(url):
+    """Return filepath based on a md5 hash of a url."""
+    return os.path.join(VIDEO_DIRECTORY, hashlib.md5(url.encode()).hexdigest())
+
+def download_video_from_url(url):
+    """Download video from url or return md5 hash as video name"""
+    filepath = filepath_from_url(url)
+    if not os.path.exists(filepath):
+        with (urllib.request.urlopen(url)) as f, open(filepath, 'wb') as fileout:
+            fileout.write(f.read())
+        logging.info(f"Downloaded video from {url} to {filepath}.")
+    else:
+        logging.info(f"Skipping downloading from {url} because {filepath} already exists.")
+    return filepath
+
+def change_ffmpeg_fps(clip, fps=FPS):
+    # Hacking the ffmpeg call based on
+    # https://github.com/Zulko/moviepy/blob/master/moviepy/video/io/ffmpeg_reader.py#L126
+    import subprocess as sp
+
+    cmd = [arg + ",fps=%d" % fps if arg.startswith("scale=") else arg for arg in clip.reader.proc.args]
+    clip.reader.close()
+    clip.reader.proc = sp.Popen(cmd, bufsize=clip.reader.bufsize,
+                                stdout=sp.PIPE, stderr=sp.PIPE, stdin=sp.DEVNULL)
+    clip.fps = clip.reader.fps = fps
+    clip.reader.lastread = clip.reader.read_frame()
+    return clip
+
+def compute_hash(frame, hash_size=16):
+    image = Image.fromarray(np.array(frame))
+    return imagehash.phash(image, hash_size)
+
+def binary_array_to_uint8s(arr):
+    bit_string = ''.join(str(1 * x) for l in arr for x in l)
+    return [int(bit_string[i:i+8], 2) for i in range(0, len(bit_string), 8)]
+
+def compute_hashes(url: str, fps=FPS):
+    clip = VideoFileClip(download_video_from_url(url))
+    for index, frame in enumerate(change_ffmpeg_fps(clip, fps).iter_frames()):
+        # Each frame is a triplet of size (height, width, 3) of the video since it is RGB
+        # The hash itself is of size (hash_size, hash_size)
+        # The uint8 version of the hash is of size (hash_size * highfreq_factor,) and represents the hash
+        hashed = np.array(binary_array_to_uint8s(compute_hash(frame).hash), dtype='uint8')
+        yield {"frame": 1+index*fps, "hash": hashed}
videomatch.py ADDED

@@ -0,0 +1,100 @@
+import os
+import logging
+
+import faiss
+
+from kats.detectors.cusum_detection import CUSUMDetector
+from kats.detectors.robust_stat_detection import RobustStatDetector
+from kats.consts import TimeSeriesData
+
+import numpy as np
+
+from videohash import compute_hashes, filepath_from_url
+
+def index_hashes_for_video(url: str) -> faiss.IndexBinaryIVF:
+    """ Compute hashes of a video and index the video using faiss indices and return the index. """
+    filepath = filepath_from_url(url)
+    if os.path.exists(f'{filepath}.index'):
+        logging.info(f"Loading indexed hashes from {filepath}.index")
+        binary_index = faiss.read_index_binary(f'{filepath}.index')
+        logging.info(f"Index {filepath}.index has in total {binary_index.ntotal} frames")
+        return binary_index
+
+    hash_vectors = np.array([x['hash'] for x in compute_hashes(url)])
+    logging.info(f"Computed hashes for {hash_vectors.shape} frames.")
+
+    # Initializing the quantizer.
+    quantizer = faiss.IndexBinaryFlat(hash_vectors.shape[1]*8)
+    # Initializing index.
+    index = faiss.IndexBinaryIVF(quantizer, hash_vectors.shape[1]*8, min(16, hash_vectors.shape[0]))
+    index.nprobe = 1 # Number of nearest clusters to be searched per query.
+    # Training the quantizer.
+    index.train(hash_vectors)
+    #index = faiss.IndexBinaryFlat(64)
+    index.add(hash_vectors)
+    faiss.write_index_binary(index, f'{filepath}.index')
+    logging.info(f"Indexed hashes for {index.ntotal} frames to {filepath}.index.")
+    return index
+
+def get_video_indices(filepath: str, target: str, MIN_DISTANCE: int = 4):
+    """" The comparison between the target and the original video will be plotted based
+    on the matches between the target and the original video over time. The matches are determined
+    based on the minimum distance between hashes (as computed by faiss-vectors) before they're considered a match.
+
+    args:
+    - url: url of the source video (short video which you want to be checked)
+    - target: url of the target video (longer video which is a superset of the source video)
+    - MIN_DISTANCE: integer representing the minimum distance between hashes on bit-level before its considered a match
+    """
+    # TODO: Fix crash if no matches are found
+
+    # Url (short video)
+    video_index = index_hashes_for_video(filepath)
+    video_index.make_direct_map() # Make sure the index is indexable
+    hash_vectors = np.array([video_index.reconstruct(i) for i in range(video_index.ntotal)]) # Retrieve original indices
+
+    # Target video (long video)
+    target_indices = [index_hashes_for_video(x) for x in [target]]
+
+    return video_index, hash_vectors, target_indices
+
+def compare_videos(hash_vectors, target_indices, MIN_DISTANCE = 3):
+    """ Search for matches between the indices of the target video (long video)
+    and the given hash vectors of a video"""
+    # The results are returned as a triplet of 1D arrays
+    # lims, D, I, where result for query i is in I[lims[i]:lims[i+1]]
+    # (indices of neighbors), D[lims[i]:lims[i+1]] (distances).
+    for index in target_indices:
+        lims, D, I = index.range_search(hash_vectors, MIN_DISTANCE)
+    return lims, D, I, hash_vectors
+
+def get_decent_distance(url, target, MIN_DISTANCE, MAX_DISTANCE):
+    """ To get a decent heurstic for a base distance check every distance from MIN_DISTANCE to MAX_DISTANCE
+    until the number of matches found is equal to or higher than the number of frames in the source video"""
+    for distance in np.arange(start = MIN_DISTANCE - 2, stop = MAX_DISTANCE + 2, step = 2, dtype=int):
+        distance = int(distance)
+        video_index, hash_vectors, target_indices = get_video_indices(url, target, MIN_DISTANCE = distance)
+        lims, D, I, hash_vectors = compare_videos(hash_vectors, target_indices, MIN_DISTANCE = distance)
+        nr_source_frames = video_index.ntotal
+        nr_matches = len(D)
+        logging.info(f"{(nr_matches/nr_source_frames) * 100.0:.1f}% of frames have a match for distance '{distance}' ({nr_matches} matches for {nr_source_frames} frames)")
+        if nr_matches >= nr_source_frames:
+            return distance
+    logging.warning(f"No matches found for any distance between {MIN_DISTANCE} and {MAX_DISTANCE}")
+    return None
+
+def get_change_points(df, smoothing_window_size=10, method='CUSUM'):
+    tsd = TimeSeriesData(df.loc[:,['time','OFFSET_LIP']])
+    if method.upper() == "CUSUM":
+        detector = CUSUMDetector(tsd)
+    elif method.upper() == "ROBUST":
+        detector = RobustStatDetector(tsd)
+    change_points = detector.detector(smoothing_window_size=smoothing_window_size, comparison_window=-2)
+
+    # Print some stats
+    if method.upper() == "CUSUM" and change_points != []:
+        mean_offset_prechange = change_points[0].mu0
+        mean_offset_postchange = change_points[0].mu1
+        jump_s = mean_offset_postchange - mean_offset_prechange
+        print(f"Video jumps {jump_s:.1f}s in time at {mean_offset_prechange:.1f} seconds")
+    return change_points