evaluation and visualization code

drinkingcoder · drinkingcoder · commit 7ae705217511 · 2022-08-09T15:15:31.000+08:00
diff --git a/README.md b/README.md
@@ -66,6 +66,42 @@ We provide [models](https://drive.google.com/drive/folders/1K2dcWxaqOLiQ3PoqRdok
     ├── sintel.pth
     ├── kitti.pth
 ```
+
+## Evaluation
+The model to be evaluated is assigned by the `_CN.model` in the config file.
+
+Evaluating the model on the Sintel training set and the KITTI training set. The corresponding config file is `configs/things_eval.py`.
+```Shell
+python evaluate_FlowFormer_tile.py --eval sintel_validation
+python evaluate_FlowFormer_tile.py --eval kitti_validation
+```
+Generating the submission for the Sintel and KITTI benchmarks. The corresponding config file is `configs/submission.py`.
+```Shell
+python evaluate_FlowFormer_tile.py --eval sintel_submission
+python evaluate_FlowFormer_tile.py --eval kitti_submission
+```
+Visualizing the sintel dataset:
+```Shell
+python visualize_flow.py --eval_type sintel
+```
+Visualizing an image sequence extracted from a video:
+```Shell
+python visualize_flow.py --eval_type seq
+```
+The default image sequence format is:
+```Shell
+├── demo_data
+    ├── mihoyo
+        ├── 000001.png
+        ├── 000002.png
+        ├── 000003.png
+            .
+            .
+            .
+        ├── 001000.png
+```
+
+
 ## License
 FlowFormer is released under the Apache License
 
diff --git a/evaluate_FlowFormer_tile.py b/evaluate_FlowFormer_tile.py
@@ -300,7 +300,6 @@ def validate_sintel(model, sigma=0.05):
 
 if __name__ == '__main__':
     parser = argparse.ArgumentParser()
-    parser.add_argument('--dataset', help="dataset for evaluation")
     parser.add_argument('--eval', help='eval benchmark')
     args = parser.parse_args()
 
diff --git a/visualize_flow.py b/visualize_flow.py
@@ -0,0 +1,202 @@
+import sys
+sys.path.append('core')
+
+from PIL import Image
+from glob import glob
+import argparse
+import os
+import time
+import numpy as np
+import torch
+import torch.nn.functional as F
+import matplotlib.pyplot as plt
+from configs.submission import get_cfg
+from core.utils.misc import process_cfg
+import datasets
+from utils import flow_viz
+from utils import frame_utils
+import cv2
+import math
+import os.path as osp
+
+from core.FlowFormer import build_flowformer
+
+from utils.utils import InputPadder, forward_interpolate
+import itertools
+
+TRAIN_SIZE = [432, 960]
+
+
+def compute_grid_indices(image_shape, patch_size=TRAIN_SIZE, min_overlap=20):
+  if min_overlap >= TRAIN_SIZE[0] or min_overlap >= TRAIN_SIZE[1]:
+    raise ValueError(
+        f"Overlap should be less than size of patch (got {min_overlap}"
+        f"for patch size {patch_size}).")
+  if image_shape[0] == TRAIN_SIZE[0]:
+    hs = list(range(0, image_shape[0], TRAIN_SIZE[0]))
+  else:
+    hs = list(range(0, image_shape[0], TRAIN_SIZE[0] - min_overlap))
+  if image_shape[1] == TRAIN_SIZE[1]:
+    ws = list(range(0, image_shape[1], TRAIN_SIZE[1]))
+  else:
+    ws = list(range(0, image_shape[1], TRAIN_SIZE[1] - min_overlap))
+
+  # Make sure the final patch is flush with the image boundary
+  hs[-1] = image_shape[0] - patch_size[0]
+  ws[-1] = image_shape[1] - patch_size[1]
+  return [(h, w) for h in hs for w in ws]
+
+def compute_weight(hws, image_shape, patch_size=TRAIN_SIZE, sigma=1.0, wtype='gaussian'):
+    patch_num = len(hws)
+    h, w = torch.meshgrid(torch.arange(patch_size[0]), torch.arange(patch_size[1]))
+    h, w = h / float(patch_size[0]), w / float(patch_size[1])
+    c_h, c_w = 0.5, 0.5 
+    h, w = h - c_h, w - c_w
+    weights_hw = (h ** 2 + w ** 2) ** 0.5 / sigma
+    denorm = 1 / (sigma * math.sqrt(2 * math.pi))
+    weights_hw = denorm * torch.exp(-0.5 * (weights_hw) ** 2)
+
+    weights = torch.zeros(1, patch_num, *image_shape)
+    for idx, (h, w) in enumerate(hws):
+        weights[:, idx, h:h+patch_size[0], w:w+patch_size[1]] = weights_hw
+    weights = weights.cuda()
+    patch_weights = []
+    for idx, (h, w) in enumerate(hws):
+        patch_weights.append(weights[:, idx:idx+1, h:h+patch_size[0], w:w+patch_size[1]])
+
+    return patch_weights
+
+def compute_flow(model, image1, image2, weights=None):
+    print(f"computing flow...")
+
+    image_size = image1.shape[1:]
+
+    hws = compute_grid_indices(image_size)
+    if weights is None:
+        weights = compute_weight(hws, image_size, sigma=0.05)
+
+    image1, image2 = image1[None].cuda(), image2[None].cuda()
+
+    flows = 0
+    flow_count = 0
+
+    for idx, (h, w) in enumerate(hws):
+        image1_tile = image1[:, :, h:h+TRAIN_SIZE[0], w:w+TRAIN_SIZE[1]]
+        image2_tile = image2[:, :, h:h+TRAIN_SIZE[0], w:w+TRAIN_SIZE[1]]    
+        flow_pre, _ = model(image1_tile, image2_tile)
+        padding = (w, image_size[1]-w-TRAIN_SIZE[1], h, image_size[0]-h-TRAIN_SIZE[0], 0, 0)
+        flows += F.pad(flow_pre * weights[idx], padding)
+        # flow_count += F.pad(weights, padding)
+        flow_count += F.pad(weights[idx], padding)
+
+    flow_pre = flows / flow_count
+    flow = flow_pre[0].permute(1, 2, 0).cpu().numpy()
+
+    return flow, weights
+
+def compute_adaptive_image_size(image_size):
+    target_size = TRAIN_SIZE
+    scale0 = target_size[0] / image_size[0]
+    scale1 = target_size[1] / image_size[1] 
+
+    if scale0 > scale1:
+        scale = scale0
+    else:
+        scale = scale1
+
+    image_size = (int(image_size[1] * scale), int(image_size[0] * scale))
+
+    return image_size
+
+def prepare_image(root_dir, viz_root_dir, fn1, fn2):
+    print(f"preparing image...")
+    print(f"root dir = {root_dir}, fn = {fn1}")
+
+    image1 = frame_utils.read_gen(osp.join(root_dir, fn1))
+    image2 = frame_utils.read_gen(osp.join(root_dir, fn2))
+    image1 = np.array(image1).astype(np.uint8)[..., :3]
+    image2 = np.array(image2).astype(np.uint8)[..., :3]
+    dsize = compute_adaptive_image_size(image1.shape[0:2])
+    image1 = cv2.resize(image1, dsize=dsize, interpolation=cv2.INTER_CUBIC)
+    image2 = cv2.resize(image2, dsize=dsize, interpolation=cv2.INTER_CUBIC)
+    image1 = torch.from_numpy(image1).permute(2, 0, 1).float()
+    image2 = torch.from_numpy(image2).permute(2, 0, 1).float()
+
+
+    dirname = osp.dirname(fn1)
+    filename = osp.splitext(osp.basename(fn1))[0]
+
+    viz_dir = osp.join(viz_root_dir, dirname)
+    if not osp.exists(viz_dir):
+        os.makedirs(viz_dir)
+
+    viz_fn = osp.join(viz_dir, filename + '.png')
+
+    return image1, image2, viz_fn
+
+def build_model():
+    print(f"building  model...")
+    cfg = get_cfg()
+    model = torch.nn.DataParallel(build_flowformer(cfg))
+    model.load_state_dict(torch.load(cfg.model))
+
+    model.cuda()
+    model.eval()
+
+    return model
+
+def visualize_flow(root_dir, viz_root_dir, model, img_pairs):
+    weights = None
+    for img_pair in img_pairs:
+        fn1, fn2 = img_pair
+        print(f"processing {fn1}, {fn2}...")
+
+        image1, image2, viz_fn = prepare_image(root_dir, viz_root_dir, fn1, fn2)
+        flow, weights = compute_flow(model, image1, image2, weights)
+        flow_img = flow_viz.flow_to_image(flow)
+        cv2.imwrite(viz_fn, flow_img[:, :, [2,1,0]])
+
+def process_sintel(sintel_dir):
+    img_pairs = []
+    for scene in os.listdir(sintel_dir):
+        dirname = osp.join(sintel_dir, scene)
+        image_list = sorted(glob(osp.join(dirname, '*.png')))
+        for i in range(len(image_list)-1):
+            img_pairs.append((image_list[i], image_list[i+1]))
+
+    return img_pairs
+
+def generate_pairs(dirname, start_idx, end_idx):
+    img_pairs = []
+    for idx in range(start_idx, end_idx):
+        img1 = osp.join(dirname, f'{idx:06}.png')
+        img2 = osp.join(dirname, f'{idx+1:06}.png')
+        # img1 = f'{idx:06}.png'
+        # img2 = f'{idx+1:06}.png'
+        img_pairs.append((img1, img2))
+
+    return img_pairs
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--eval_type', default='sintel')
+    parser.add_argument('--start_idx', type=int, default=1)
+    parser.add_argument('--end_idx', type=int, default=1200)
+    parser.add_argument('--root_dir', default='.')
+    parser.add_argument('--sintel_dir', default='datasets/Sintel/test/clean')
+    parser.add_argument('--seq_dir', default='demo_data/mihoyo')
+    parser.add_argument('--viz_root_dir', default='viz_results')
+
+    args = parser.parse_args()
+
+    root_dir = args.root_dir
+    viz_root_dir = args.viz_root_dir
+
+    model = build_model()
+
+    if args.eval_type == 'sintel':
+        img_pairs = process_sintel(args.sintel_dir)
+    elif args.eval_type == 'seq':
+        img_pairs = generate_pairs(args.seq_dir, args.start_idx, args.end_idx)
+    with torch.no_grad():
+        visualize_flow(root_dir, viz_root_dir, model, img_pairs)