Spaces:
Runtime error
Runtime error
File size: 9,918 Bytes
8c31b90 95312c3 cebe383 8c31b90 df9abf4 24aac30 df9abf4 8c31b90 df9abf4 8c31b90 df9abf4 58538bf 7ce8504 58538bf 3ff595d 58538bf d123883 58538bf 7ce8504 58538bf 026b32c 58538bf 026b32c df9abf4 8b5d61a 8c31b90 0d0ab89 df9abf4 8c31b90 0d0ab89 df9abf4 8c31b90 df9abf4 8c31b90 df9abf4 8c31b90 df9abf4 8c31b90 df9abf4 8f43f06 8c31b90 df9abf4 8f43f06 8c31b90 df9abf4 c103e03 0d0ab89 df9abf4 8c31b90 58538bf b0547a1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 |
import os
import subprocess
import glob
import streamlit as st
from utils import get_configs, get_display_names, get_path_for_viz, get_video_height, get_text_str
# st.header("EVREAL - Event-based Video Reconstruction Evaluation and Analysis Library")
#
# paper_link = "https://arxiv.org/abs/2305.00434"
# code_link = "https://github.com/ercanburak/EVREAL"
# page_link = "https://ercanburak.github.io/evreal.html"
# instructions_video = "https://www.youtube.com/watch?v="
#
# st.markdown("Paper: " + paper_link, unsafe_allow_html=True)
# st.markdown("Code: " + paper_link, unsafe_allow_html=True)
# st.markdown("Page: " + paper_link, unsafe_allow_html=True)
# st.markdown("Please see this video for instructions on how to use this tool: " + instructions_video, unsafe_allow_html=True)
@st.cache_data(show_spinner="Retrieving results...")
def retrieve_results(selected_dataset, selected_sequence, selected_models, selected_metrics, selected_visualizations):
gt_only_viz = [viz for viz in selected_visualizations if viz['viz_type'] == 'gt_only']
model_only_viz = [viz for viz in selected_visualizations if viz['viz_type'] == 'model_only']
both_viz = [viz for viz in selected_visualizations if viz['viz_type'] == 'both']
recon_viz = {"name": "recon", "display_name": "Reconstruction", "viz_type": "both", "gt_type": "frame"}
ground_truth = {"name": "gt", "display_name": "Ground Truth", "model_id": "groundtruth"}
model_viz = [recon_viz] + both_viz + selected_metrics + model_only_viz
num_model_rows = len(model_viz)
gt_viz = []
if selected_dataset['has_frames']:
gt_viz.append(recon_viz)
gt_viz.extend([viz for viz in both_viz if viz['gt_type'] == 'frame'])
gt_viz.extend([viz for viz in gt_only_viz if viz['gt_type'] == 'frame'])
gt_viz.extend([viz for viz in both_viz if viz['gt_type'] == 'event'])
gt_viz.extend([viz for viz in gt_only_viz if viz['gt_type'] == 'event'])
num_gt_rows = len(gt_viz)
num_rows = max(num_model_rows, num_gt_rows)
# total_videos_needed = len(selected_models) * num_model_rows + num_gt_rows
if len(gt_viz) > 0:
selected_models.append(ground_truth)
padding = 2
font_size = 20
num_cols = len(selected_models)
crop_str = "crop=trunc(iw/2)*2-2:trunc(ih/2)*2,"
pad_str = "pad=ceil(iw/2)*2+{}:ceil(ih/2)*2+{}:{}:{}:white".format(padding*2, padding*2, padding, padding)
num_elements = num_rows * num_cols
# remove previous temp data
files = glob.glob('temp_data/temp_*.mp4')
for f in files:
os.remove(f)
w = selected_dataset["width"]
h = selected_dataset["height"]
input_filter_parts = []
xstack_input_parts = []
layout_parts = []
video_paths = []
row_heights = [""]*num_rows
gt_viz_indices = []
if len(model_viz) > 1:
left_pad = (font_size*0.7)*max([len(viz['display_name']) for viz in model_viz[1:]]) + padding*2
else:
left_pad = 0
for row_idx in range(num_rows):
for col_idx in range(num_cols):
vid_idx = len(video_paths)
# progress_bar.progress(float(vid_idx) / total_videos_needed)
cur_model = selected_models[col_idx]
if cur_model['name'] == "gt":
if row_idx < len(gt_viz):
video_path = get_path_for_viz(base_data_dir, selected_dataset, selected_sequence, cur_model, gt_viz[row_idx])
if not os.path.isfile(video_path):
raise ValueError("Could not find video: " + video_path)
gt_viz_indices.append(vid_idx)
else:
continue
else:
if row_idx < len(model_viz):
video_path = get_path_for_viz(base_data_dir, selected_dataset, selected_sequence, cur_model, model_viz[row_idx])
if not os.path.isfile(video_path):
raise ValueError("Could not find video: " + video_path)
else:
continue
if row_heights[row_idx] == "":
row_heights[row_idx] = "h{}".format(vid_idx)
if row_idx == 0:
pad_height = font_size+padding*2
pad_txt_str = ",pad={}:{}:0:{}:white".format(w+padding*2, h+font_size+padding*4, pad_height)
text_str = get_text_str(pad_height, w, cur_model['display_name'], font_size)
pad_txt_str = pad_txt_str + "," + text_str
elif col_idx == 0:
pad_txt_str = ",pad={}:ih:{}:0:white".format(w + left_pad + padding * 2, left_pad)
if len(model_viz) > row_idx > 0:
text_str = get_text_str("h", left_pad, model_viz[row_idx]['display_name'], font_size)
pad_txt_str = pad_txt_str + "," + text_str
else:
pad_txt_str = ""
input_filter_part = "[{}:v]scale={}:-1,{}{}{}[v{}]".format(vid_idx, w, crop_str, pad_str, pad_txt_str, vid_idx)
input_filter_parts.append(input_filter_part)
xstack_input_part = "[v{}]".format(vid_idx)
xstack_input_parts.append(xstack_input_part)
video_paths.append(video_path)
if row_idx == 0 or col_idx > 0:
layout_w_parts = [str(left_pad)] + ["w{}".format(i) for i in range(col_idx)]
layout_w = "+".join(layout_w_parts)
else:
layout_w = "+".join(["w{}".format(i) for i in range(col_idx)]) if col_idx > 0 else "0"
if cur_model['name'] == "gt":
layout_h = "+".join(["h{}".format(i) for i in gt_viz_indices[:-1]]) if row_idx > 0 else "0"
else:
layout_h = "+".join(row_heights[:row_idx]) if row_idx > 0 else "0"
layout_part = layout_w + "_" + layout_h
layout_parts.append(layout_part)
inputs_str = " ".join(["-i " + video_path for video_path in video_paths])
num_inputs = len(video_paths)
input_scaling_str = ";".join(input_filter_parts)
xstack_input_str = "".join(xstack_input_parts)
layout_str = "|".join(layout_parts)
# opt = "-c:v libx264 -preset veryslow -crf 18 -c:a copy"
opt = ""
# opt_fill = ":fill=black"
opt_fill = ":fill=white"
# opt_fill = ""
if num_inputs > 1:
ffmpeg_command_str = "ffmpeg -y " + inputs_str + " -filter_complex \"" + input_scaling_str + ";" + xstack_input_str + "xstack=inputs=" + str(num_inputs) + ":layout=" + layout_str + opt_fill + "\"" + opt + " output.mp4"
else:
# remove last paranthesis
idx = input_scaling_str.rfind("[")
input_scaling_str = input_scaling_str[:idx]
ffmpeg_command_str = "ffmpeg -y " + inputs_str + " -filter_complex \"" + input_scaling_str + "\"" + opt + " output.mp4"
print(ffmpeg_command_str)
ret = subprocess.call(ffmpeg_command_str, shell=True)
if ret != 0:
return None
video_file = open('output.mp4', 'rb')
video_bytes = video_file.read()
return video_bytes
st.title("Result Analysis Tool")
base_data_dir = "data"
dataset_cfg_path = os.path.join("cfg", "dataset")
model_cfg_path = os.path.join("cfg", "model")
metric_cfg_path = os.path.join("cfg", "metric")
viz_cfg_path = os.path.join("cfg", "viz")
datasets = get_configs(dataset_cfg_path)
models = get_configs(model_cfg_path)
metrics = get_configs(metric_cfg_path)
visualizations = get_configs(viz_cfg_path)
dataset_display_names = get_display_names(datasets)
model_display_names = get_display_names(models)
metric_display_names = get_display_names(metrics)
viz_display_names = get_display_names(visualizations)
assert len(set(dataset_display_names)) == len(dataset_display_names), "Dataset display names are not unique"
assert len(set(model_display_names)) == len(model_display_names), "Model display names are not unique"
assert len(set(metric_display_names)) == len(metric_display_names), "Metric display names are not unique"
assert len(set(viz_display_names)) == len(viz_display_names), "Viz display names are not unique"
col1, col2 = st.columns(2)
with col1:
selected_dataset_name = st.selectbox('Select dataset', options=dataset_display_names)
selected_dataset = [dataset for dataset in datasets if dataset['display_name'] == selected_dataset_name][0]
with col2:
selected_sequence = st.selectbox('Select sequence', options=selected_dataset["sequences"].keys())
selected_model_names = st.multiselect('Select multiple methods to compare', model_display_names)
selected_models = [model for model in models if model['display_name'] in selected_model_names]
disable_metrics = len(selected_models) == 0
if disable_metrics:
tooltip_str = "Select at least one method to enable metric selection"
else:
tooltip_str = ""
usable_metrics = [metric for metric in metrics if metric['no_ref'] == selected_dataset['no_ref']]
usable_metric_display_names = get_display_names(usable_metrics)
selected_metric_names = st.multiselect('Select metrics to display', usable_metric_display_names,
disabled=disable_metrics, help=tooltip_str)
selected_metrics = [metric for metric in usable_metrics if metric['display_name'] in selected_metric_names]
if not selected_dataset['has_frames']:
usable_viz = [viz for viz in visualizations if viz['gt_type'] != 'frame']
else:
usable_viz = visualizations
usable_viz_display_names = get_display_names(usable_viz)
selected_viz = st.multiselect('Select other visualizations to display', usable_viz_display_names)
selected_visualizations = [viz for viz in visualizations if viz['display_name'] in selected_viz]
if not st.button('Get Results'):
st.stop()
video_bytes = retrieve_results(selected_dataset, selected_sequence, selected_models, selected_metrics, selected_visualizations)
if video_bytes is None:
st.error("Error while generating video.")
st.stop()
st.video(video_bytes)
|