-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvideo_analysis.py
203 lines (164 loc) · 7.57 KB
/
video_analysis.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
import cv2
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.animation import FFMpegWriter
import argparse
import sys
#import pickle
from similarity_metrics.fsim_quality import FSIMsimilarity
from similarity_metrics.issm_quality import ISSMsimilarity
from CopulaSimilarity.CSM import CopulaBasedSimilarity as CSIMSimilarity
from similarity_metrics.ssim_rmse_psnr_metrics import ssim
class SimilarityMetrics:
def __init__(self, patch_size=8):
self.fsim_similarity = FSIMsimilarity()
self.issm_similarity = ISSMsimilarity()
self.copula_similarity = CSIMSimilarity(patch_size=patch_size)
def compute_ssim(self, reference_frame, current_frame):
return ssim(reference_frame, current_frame)
def compute_fsim(self, reference_frame, current_frame):
return self.fsim_similarity.fsim(reference_frame, current_frame)
def compute_issm(self, reference_frame, current_frame):
return self.issm_similarity.issm(reference_frame, current_frame)
def compute_csim(self, reference_frame, current_frame):
csim = self.copula_similarity.compute_local_similarity(reference_frame, current_frame)
return csim, np.mean(csim)
def update_progress_bar(total_frames, processed_frames, bar_length=50):
percent_complete = (processed_frames / total_frames) * 100
num_hashes = int((percent_complete / 100) * bar_length)
bar = '#' * num_hashes + '-' * (bar_length - num_hashes)
sys.stdout.write(f'\rProgress: |{bar}| {percent_complete:.2f}%')
sys.stdout.flush()
def process_video(video_path, resolution_factor, output_video, ssim, fsim, issm, save_final_frame, show_live_window, patch_size):
metrics = SimilarityMetrics(patch_size=patch_size)
cap = cv2.VideoCapture(video_path)
if not cap.isOpened():
print("Error: Could not open video file.")
return
total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
print(f'Total frames: {total_frames}')
ret, reference_frame = cap.read()
if not ret:
print("Error: Could not read the first frame.")
cap.release()
return
ref_resized = cv2.resize(
reference_frame,
(reference_frame.shape[1] // resolution_factor,
reference_frame.shape[0] // resolution_factor)
)
ref_rgb = cv2.cvtColor(ref_resized, cv2.COLOR_BGR2RGB)
ssim_results = []
fsim_results = []
issm_results = []
csim_results = []
csim_maps = []
frame_indices = []
fig = plt.figure(figsize=(20, 12))
gs = fig.add_gridspec(2, 3, height_ratios=[1, 1.5])
video_ax = fig.add_subplot(gs[0, 0])
diff_ax = fig.add_subplot(gs[0, 1])
csim_ax = fig.add_subplot(gs[0, 2])
plot_ax = fig.add_subplot(gs[1, :])
font_title = 24
font_labels = 20
font_ticks = 18
video_ax.set_title('(a)', fontsize=font_title)
diff_ax.set_title('(b)', fontsize=font_title)
csim_ax.set_title('(c)', fontsize=font_title)
plot_ax.set_title('(d)', fontsize=font_title)
plot_ax.plot([], [], 'g-', label='SSIM')
plot_ax.plot([], [], 'b-', label='FSIM')
plot_ax.plot([], [], 'm-', label='ISSM')
plot_ax.plot([], [], 'r-', label='CSIM')
plot_ax.set_xlim(0, 100)
plot_ax.set_ylim(0, 1)
plot_ax.set_xlabel('Frame Index', fontsize=font_labels)
plot_ax.set_ylabel('Metric Value', fontsize=font_labels)
plot_ax.legend(loc='lower left', fontsize=font_labels)
for ax in [video_ax, diff_ax, csim_ax, plot_ax]:
ax.tick_params(axis='both', which='major', labelsize=font_ticks)
writer = FFMpegWriter(fps=30, codec='libx264')
with writer.saving(fig, output_video, dpi=100):
frame_count = 0
while True:
ret, frame = cap.read()
if not ret:
break
current_resized = cv2.resize(
frame,
(ref_resized.shape[1], ref_resized.shape[0])
)
current_rgb = cv2.cvtColor(current_resized, cv2.COLOR_BGR2RGB)
ssim_value = metrics.compute_ssim(ref_rgb, current_rgb)
fsim_value = metrics.compute_fsim(ref_rgb, current_rgb)
issm_value = metrics.compute_issm(ref_rgb, current_rgb)
csim_map, csim_mean = metrics.compute_csim(ref_rgb, current_rgb)
diff_frame = cv2.absdiff(current_rgb, ref_rgb)
frame_indices.append(frame_count)
if ssim:
ssim_results.append(ssim_value)
if fsim:
fsim_results.append(fsim_value)
if issm:
issm_results.append(issm_value)
csim_results.append(csim_mean)
csim_maps.append(csim_map)
video_ax.imshow(current_rgb)
video_ax.axis('off')
diff_rgb = cv2.cvtColor(diff_frame, cv2.COLOR_BGR2RGB)
diff_ax.imshow(diff_rgb)
diff_ax.axis('off')
csim_map_resized = cv2.resize(csim_map, (current_resized.shape[1], current_resized.shape[0]))
csim_ax.imshow(csim_map_resized, cmap='hot', interpolation='nearest')
csim_ax.axis('off')
plot_ax.clear()
if ssim:
plot_ax.plot(frame_indices, ssim_results, 'g-', label='SSIM')
if fsim:
plot_ax.plot(frame_indices, fsim_results, 'b-', label='FSIM')
if issm:
plot_ax.plot(frame_indices, issm_results, 'm-', label='ISSM')
plot_ax.plot(frame_indices, csim_results, 'r-', label='CSIM')
plot_ax.set_xlim(0, len(frame_indices))
plot_ax.set_ylim(0, 1)
plot_ax.set_xlabel('Frame Index', fontsize=font_labels)
plot_ax.set_ylabel('Metric Value', fontsize=font_labels)
plot_ax.set_title('(d)', fontsize=font_title)
plot_ax.legend(loc='lower left', fontsize=font_labels)
plt.draw()
writer.grab_frame()
if show_live_window:
plt.pause(0.001)
update_progress_bar(total_frames, frame_count)
frame_count += 1
if save_final_frame:
fig.savefig('final_frame.pdf', bbox_inches='tight')
cap.release()
plt.close(fig)
''' #pickle data saving data (optional)
data = {
'frame_indices': frame_indices,
'ssim_results': ssim_results,
'fsim_results': fsim_results,
'issm_results': issm_results,
'csim_results': csim_results,
'csim_maps': csim_maps
}
with open('similarity_metrics_data.pkl', 'wb') as f:
pickle.dump(data, f)
print("Data has been saved to similarity_metrics_data.pkl")
'''
if __name__ == "__main__":
parser = argparse.ArgumentParser(description='Video analysis')
parser.add_argument('--path_to_video', help='Path to video file')
parser.add_argument('--output_video_path', help='Path to output video file')
parser.add_argument('--ssim', action='store_true', help='Compute SSIM')
parser.add_argument('--fsim', action='store_true', help='Compute FSIM')
parser.add_argument('--issm', action='store_true', help='Compute ISSM')
parser.add_argument('--save_final_frame', action='store_true', help='Save final frame')
parser.add_argument('--show_live_window', action='store_true', help='Show live window')
parser.add_argument('--resolution_factor', type=int, default=8, help='Resolution factor')
parser.add_argument('--patch_size', type=int, default=8, help='Patch size for CopulaBasedSimilarity')
args = parser.parse_args()
process_video(args.path_to_video, args.resolution_factor, args.output_video_path, args.ssim, args.fsim, args.issm, args.save_final_frame, args.show_live_window, args.patch_size)