Video-Summarization/similarity.py at main · spesavento/Video-Summarization · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
#!/usr/bin/env python

# python -m pip install -U scikit-image
# (also Cython, numpy, scipy, matplotlib, networkx, pillow, imageio, tifffile, PyWavelets)
from skimage import data, img_as_float
from skimage.metrics import structural_similarity as ssim
# from skimage.metrics import mean_squared_error
# import numpy as np
import cv2
# import glob
# import numpy as np
import os
from os.path import isfile, join

def _read_gray_frame(full_frame_path, index):
    """Load ``frame<index>.jpg`` from *full_frame_path* as a grayscale image.

    Args:
        full_frame_path: Directory that holds the extracted video frames.
        index: Frame number used to build the file name.

    Returns:
        The frame converted from BGR to a single grayscale channel.

    Raises:
        FileNotFoundError: If OpenCV could not read the frame file.
    """
    frame_file = os.path.join(full_frame_path, 'frame' + str(index) + '.jpg')
    frame = cv2.imread(frame_file)
    if frame is None:
        # cv2.imread reports failure by returning None instead of raising,
        # which would otherwise surface as an opaque error inside cvtColor.
        raise FileNotFoundError('could not read frame image: ' + frame_file)
    return cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)


def ShotChange(full_frame_path, ratio_threshold=0.6, min_shot_gap=20):
    """Build the list of frame numbers at which a new shot starts.

    Frames are read as ``frame0.jpg``, ``frame1.jpg``, ... from
    *full_frame_path*.  A window of four consecutive frames a, b, c, d is slid
    over the video and the SSIM of each adjacent pair (ab, bc, cd) is compared.
    When bc is much lower than both neighbours (a "local minimum"), frame c is
    recorded as the first frame of a new shot.

    Args:
        full_frame_path: Directory that holds the extracted video frames.
        ratio_threshold: bc must be below this fraction of both ab and cd to
            count as a shot change.  The default of 0.6 was picked
            empirically by the original author.
        min_shot_gap: A candidate at loop position ``i`` (frame ``i + 2``) is
            accepted only if ``i - last_change > min_shot_gap``, which
            suppresses changes that follow each other too closely.

    Returns:
        A list of frame numbers.  Frame 0 is always included as the start of
        the first shot.  With fewer than three frames no comparison is
        possible and ``[0]`` is returned.

    Raises:
        FileNotFoundError: If an expected frame file cannot be read.
    """
    print ('determining shot changes ...this might take a minute')
    # Count only real frame files; stray entries such as .DS_Store or
    # sub-folders would otherwise inflate the count and make the loop ask for
    # frames that do not exist.
    num = sum(
        1 for name in os.listdir(full_frame_path)
        if name.startswith('frame')
        and name.endswith('.jpg')
        and name[len('frame'):-len('.jpg')].isdigit()
    )
    # keep the very first frame as a scene change
    shot_change = [0]
    if num < 3:
        # not enough frames to form even one ab/bc pair
        print('shot change array is:')
        print(shot_change)
        return shot_change
    # loop position of the most recent accepted change, used for min_shot_gap
    last_frame = 0
    # prime the window with the first three frames
    frame_a_bw = _read_gray_frame(full_frame_path, 0)
    frame_b_bw = _read_gray_frame(full_frame_path, 1)
    frame_c_bw = _read_gray_frame(full_frame_path, 2)
    ssim_ab = ssim(frame_a_bw, frame_b_bw)
    ssim_bc = ssim(frame_b_bw, frame_c_bw)
    # frame d is frame i+3, so stop once the last frame has been used
    for i in range(0, num - 3):
        frame_d_bw = _read_gray_frame(full_frame_path, i + 3)
        ssim_cd = ssim(frame_c_bw, frame_d_bw)
        # Written as products rather than ratios so a zero score can never
        # cause a division by zero; identical to the ratio test whenever the
        # neighbouring scores are positive.
        is_local_minimum = (ssim_bc < ratio_threshold * ssim_ab
                            and ssim_bc < ratio_threshold * ssim_cd)
        if is_local_minimum and i - last_frame > min_shot_gap:
            # frame c (number i+2) is the first frame of the new shot
            last_frame = i + 2
            shot_change.append(i + 2)
        # slide the window one frame forward
        ssim_ab = ssim_bc
        ssim_bc = ssim_cd
        frame_c_bw = frame_d_bw
    print('shot change array is:')
    print(shot_change)
    return shot_change

def MakeSummaryFrames(full_frame_path, summary_frame_path, shot_change,
                      keep_every=6, total_frames=None):
    """Write a reduced set of frames for every shot into the summary folder.

    Each shot is thinned by keeping every *keep_every*-th frame after the
    shot's first frame.  This is deliberately simple: it samples uniformly,
    but it does keep track of which shot each frame came from by drawing the
    shot number onto the saved image.

    Args:
        full_frame_path: Directory holding ``frame<N>.jpg`` source frames.
        summary_frame_path: Directory the summary frames are written to; it
            is created if it does not exist.
        shot_change: Frame numbers at which shots start, in ascending order.
        keep_every: Sampling step inside a shot (default 6, i.e. 1:6).
        total_frames: Number of frames in the video.  When omitted it is
            taken from the number of ``frame<N>.jpg`` files in
            *full_frame_path*.  It bounds the final shot.

    Raises:
        ValueError: If *keep_every* is smaller than 1.
    """
    print ('storing summary frames in '+summary_frame_path+'...')
    if keep_every < 1:
        raise ValueError('keep_every must be at least 1')
    if total_frames is None:
        total_frames = sum(
            1 for name in os.listdir(full_frame_path)
            if name.startswith('frame')
            and name.endswith('.jpg')
            and name[len('frame'):-len('.jpg')].isdigit()
        )
    if summary_frame_path:
        # cv2.imwrite does not create missing folders, it just fails
        os.makedirs(summary_frame_path, exist_ok=True)
    # A shot runs from its own start up to the start of the next shot.  The
    # last shot has no successor, so it runs to the final frame of the video;
    # without this the tail of the video would never be summarized.
    shot_ends = list(shot_change[1:]) + [total_frames - 1]
    for shot_number, (shot_start, shot_end) in enumerate(zip(shot_change, shot_ends)):
        # first kept frame is shot_start + keep_every, then every keep_every-th
        for save_frame in range(shot_start + keep_every, shot_end + 1, keep_every):
            summary_image = os.path.join(full_frame_path, 'frame' + str(save_frame) + '.jpg')
            img = cv2.imread(summary_image)
            if img is None:
                # imread returns None for a missing or unreadable file
                print('skipping unreadable frame ' + summary_image)
                continue
            # write the shot number on the summary frame
            cv2.putText(
                img,  # numpy image
                str(shot_number),  # text
                (10, 60),  # position
                cv2.FONT_HERSHEY_SIMPLEX,  # font
                2,  # font size
                (0, 0, 255),  # font color red in BGR
                4)  # font stroke
            # zero-pad the frame number so the files sort alphabetically
            alpha_number = str(save_frame).zfill(5)
            summary_frame_img = os.path.join(summary_frame_path, alpha_number + '.jpg')
            if not cv2.imwrite(summary_frame_img, img):
                print('could not write summary frame ' + summary_frame_img)

def FramesToVideo(summary_frame_path,pathOut,fps,frame_width,frame_height):
    """Encode the images in the summary folder into a video with OpenCV.

    The files in *summary_frame_path* are processed in sorted file-name order
    and streamed to the writer one at a time, so memory use does not grow
    with the number of frames.

    Args:
        summary_frame_path: Directory holding the summary frame images.
        pathOut: Path of the video file to create; its parent folder is
            created if it does not exist.
        fps: Frame rate of the output video.
        frame_width: Width of the output video in pixels.
        frame_height: Height of the output video in pixels.

    Raises:
        IOError: If the video writer cannot be opened for *pathOut*.
    """
    # sorted file names give the playback order
    files = sorted(
        f for f in os.listdir(summary_frame_path)
        if os.path.isfile(os.path.join(summary_frame_path, f))
    )
    out_dir = os.path.dirname(pathOut)
    if out_dir:
        os.makedirs(out_dir, exist_ok=True)
    frame_size = (frame_width, frame_height)
    # define the parameters for creating the video
    # .mp4 is a good choice for playing videos, works on OSX and Windows
    fourcc = cv2.VideoWriter_fourcc(*'MP4V')
    out = cv2.VideoWriter(pathOut, fourcc, fps, frame_size)
    try:
        if not out.isOpened():
            raise IOError('could not open video writer for ' + pathOut)
        for name in files:
            img = cv2.imread(os.path.join(summary_frame_path, name))
            if img is None:
                # not an image (or unreadable); nothing to hand to the writer
                print('skipping unreadable summary frame ' + name)
                continue
            # img.shape is (height, width, channels); the writer expects
            # every frame to match the size it was opened with.
            if (img.shape[1], img.shape[0]) != frame_size:
                img = cv2.resize(img, frame_size)
            out.write(img)
    finally:
        # always finalize the file, even if a frame fails part-way through
        out.release()


def main():
    """Run the whole summarization pipeline for the soccer clip.

    Detects the shot changes in the full set of frames, writes the reduced
    set of frames to the summary folder, and finally encodes that folder as
    a 320x180 video at 30 fps.
    """
    # input: every frame of the source video (frame0.jpg, frame1.jpg, ...)
    frames_dir = "../../project_files/project_dataset/frames/soccer/"
    # output: the frames selected for the summary
    summary_dir = "../../project_files/summary/soccer/frames/"
    # output: the encoded summary video
    video_file = '../../project_files/summary/soccer/video/soccer.mp4'

    # step 1: find the frame numbers where a new shot begins
    cuts = ShotChange(frames_dir)
    # step 2: thin out each shot and store the kept frames
    MakeSummaryFrames(frames_dir, summary_dir, cuts)
    # step 3: turn the stored frames into a video
    FramesToVideo(summary_dir, video_file, 30, 320, 180)

# Run the pipeline only when this file is executed as a script, not when it
# is imported as a module.
if __name__=="__main__":
    main()