runPaddle_demo_RGB_Depth.py

import os, argparse, time, datetime, sys, shutil, stat
import numpy as np 
from util.util import compute_results, visualize
from sklearn.metrics import confusion_matrix
from scipy.io import savemat 
import paddle
from paddle.io import DataLoader
from util.RGB_Depth_dataset import RGB_Depth_dataset
from paddle_model import InconSeg


#############################################################################################
parser = argparse.ArgumentParser(description='Test with pytorch')
#############################################################################################
parser.add_argument('--model_name', '-m', type=str, default='InconSeg')
parser.add_argument('--weight_name', '-w', type=str, default='PaddleInconSe_RGB_Depth') 
parser.add_argument('--file_name', '-f', type=str, default='final.pdparams')
parser.add_argument('--dataset_split', '-d', type=str, default='test') # abnormal_test, normal_test, urban_test, rural_test
parser.add_argument('--gpu', '-g', type=int, default=0)
#############################################################################################
parser.add_argument('--img_height', '-ih', type=int, default=288) 
parser.add_argument('--img_width', '-iw', type=int, default=512)  
parser.add_argument('--num_workers', '-j', type=int, default=1)
parser.add_argument('--n_class', '-nc', type=int, default=3)
parser.add_argument('--data_dir', '-dr', type=str, default='./dataset/')
parser.add_argument('--model_dir', '-wd', type=str, default='./weights_backup/')
args = parser.parse_args()
#############################################################################################

if __name__ == '__main__':
  
    paddle.device.set_device('gpu:0')

    # prepare save direcotry
    if os.path.exists("./runs"):
        print("previous \"./runs\" folder exist, will delete this folder")
        shutil.rmtree("./runs")
    os.makedirs("./runs")
    os.chmod("./runs", stat.S_IRWXO)  # allow the folder created by docker read, written, and execuated by local machine
    model_dir = os.path.join(args.model_dir, args.weight_name)
    
    if os.path.exists(model_dir) is False:
        sys.exit("the %s does not exit." %(model_dir))
    model_file = os.path.join(model_dir, args.file_name)
    if os.path.exists(model_file) is True:
        print('use the final model file.')
    else:
        sys.exit('no model file found.') 
    print('testing %s: %s on GPU #%d with pytorch' % (args.model_name, args.weight_name, args.gpu))
    
    conf_total = np.zeros((args.n_class, args.n_class))
    model = eval(args.model_name)(n_class=args.n_class)
    # if args.gpu >= 0: model.cuda(args.gpu)
    print('loading model file %s... ' % model_file)


    paddle_weight = paddle.load(model_file)
    model.set_state_dict(paddle_weight)


    batch_size = 1
    test_dataset  = RGB_Depth_dataset(data_dir=args.data_dir, split=args.dataset_split, input_h=args.img_height, input_w=args.img_width)
    test_loader  = DataLoader(
        dataset     = test_dataset,
        batch_size  = batch_size,
        shuffle     = False,
        num_workers = args.num_workers,
        drop_last   = False
    )
    ave_time_cost = 0.0

    model.eval()
    with paddle.no_grad():
        for it, (images, labels, names) in enumerate(test_loader):

            images = images.numpy()
            images = paddle.to_tensor(images)

            labels = labels.numpy()
            labels = paddle.to_tensor(labels)


            paddle.device.cuda.synchronize()
            start_time = time.time()
            depth_result, rgb_result,rgb_seg_f1,depth_add_f1,rgb_seg_f2,depth_add_f2,rgb_seg_f3,depth_add_f3 = model(images)  
            paddle.device.cuda.synchronize()

            end_time = time.time()
            logits = rgb_result
            if it>=5: # # ignore the first 5 frames
                ave_time_cost += (end_time-start_time)
            # convert tensor to numpy 1d array
            label = labels.cpu().numpy().squeeze().flatten()
            prediction = logits.argmax(1).cpu().numpy().squeeze().flatten() # prediction and label are both 1-d array, size: minibatch*640*480
            # generate confusion matrix frame-by-frame
            conf = confusion_matrix(y_true=label, y_pred=prediction, labels=[0,1,2]) # conf is an n_class*n_class matrix, vertical axis: groundtruth, horizontal axis: prediction
            conf_total += conf
            # save demo images
            visualize(image_name=names, predictions=logits.argmax(1), weight_name=args.weight_name)
            print("%s, %s, frame %d/%d, %s, time cost: %.2f ms, demo result saved."
                 %(args.model_name, args.weight_name, it+1, len(test_loader), names, (end_time-start_time)*1000))
 
    precision_per_class, recall_per_class, iou_per_class,F1_per_class = compute_results(conf_total)
    conf_total_matfile = os.path.join("./runs", 'conf_'+args.weight_name+'.mat')
    savemat(conf_total_matfile,  {'conf': conf_total}) # 'conf' is the variable name when loaded in Matlab
 
    print('\n###########################################################################')
    print('\n%s: %s test results (with batch size %d) on %s using %s:' %(args.model_name, args.weight_name, batch_size, datetime.date.today(), paddle.device.cuda.get_device_name(args.gpu))) 
    print('\n* the tested dataset name: %s' % args.dataset_split)
    print('* the tested image count: %d' % len(test_loader))
    print('* the tested image size: %d*%d' %(args.img_height, args.img_width)) 
    print('* the weight name: %s' %args.weight_name) 
    print('* the file name: %s' %args.file_name) 
    print("* pre per class: \n    unlabeled: %.6f, negative: %.6f, positive: %.6f" \
          %(precision_per_class[0]*100, precision_per_class[1]*100, precision_per_class[2]*100)) 
    print("* recall per class: \n    unlabeled: %.6f, negative: %.6f, positive: %.6f" \
          %(recall_per_class[0]*100, recall_per_class[1]*100, recall_per_class[2]*100))
    print("* F1 per class: \n    unlabeled: %.6f, negative: %.6f, positive: %.6f" \
          %(F1_per_class[0]*100, F1_per_class[1]*100, F1_per_class[2]*100)) 
    print("* iou per class: \n    unlabeled: %.6f, negative: %.6f, positive: %.6f" \
          %(iou_per_class[0]*100, iou_per_class[1]*100, iou_per_class[2]*100)) 


    print("\n* average values (np.mean(x)): \n pre: %.6f, recall: %.6f, F1: %.6f, iou: %.6f" \
          %(precision_per_class[:].mean()*100, recall_per_class[:].mean()*100, F1_per_class[:].mean()*100, iou_per_class[:].mean()*100))
    print("* average values (np.mean(np.nan_to_num(x))): \n pre: %.6f, recall: %.6f, F1: %.6f, iou: %.6f" \
          %(np.mean(np.nan_to_num(precision_per_class[:]*100)), np.mean(np.nan_to_num(recall_per_class[:]*100)), np.mean(np.nan_to_num(F1_per_class[:]*100)), np.mean(np.nan_to_num(iou_per_class[:]*100))))
    print('\n* the average time cost per frame (with batch size %d): %.2f ms, namely, the inference speed is %.2f fps' %(batch_size, ave_time_cost*1000/(len(test_loader)-5), 1.0/(ave_time_cost/(len(test_loader)-5)))) # ignore the first 10 frames
    #print('\n* the total confusion matrix: ') 
    #np.set_printoptions(precision=8, threshold=np.inf, linewidth=np.inf, suppress=True)
    #print(conf_total)
    print('\n###########################################################################')