mirror of https://github.com/ZHKKKe/MODNet.git
Evaluation and inference
parent 4424ab5b72
commit 48a2b96e71
@@ -0,0 +1,72 @@
import numpy as np
from glob import glob
from src.models.modnet import MODNet
from PIL import Image
from src.infer import predit_matte
import torch.nn as nn
import torch


def cal_mad(pred, gt):
    # mean absolute difference between predicted and ground-truth mattes
    diff = pred - gt
    diff = np.abs(diff)
    mad = np.mean(diff)
    return mad


def cal_mse(pred, gt):
    # mean squared error between predicted and ground-truth mattes
    diff = pred - gt
    diff = diff ** 2
    mse = np.mean(diff)
    return mse


def load_eval_dataset(dataset_root_dir='src/datasets/PPM-100'):
    # collect image/matte file paths; sorting keeps the two lists aligned
    image_path = dataset_root_dir + '/image/*'
    matte_path = dataset_root_dir + '/matte/*'
    image_file_name_list = glob(image_path)
    image_file_name_list = sorted(image_file_name_list)
    matte_file_name_list = glob(matte_path)
    matte_file_name_list = sorted(matte_file_name_list)

    return image_file_name_list, matte_file_name_list


def eval(modnet: MODNet, dataset):
    mse = total_mse = 0.0
    mad = total_mad = 0.0
    cnt = 0

    for im_pth, mt_pth in zip(dataset[0], dataset[1]):
        im = Image.open(im_pth)
        pd_matte = predit_matte(modnet, im)

        gt_matte = Image.open(mt_pth)
        gt_matte = np.asarray(gt_matte) / 255

        total_mse += cal_mse(pd_matte, gt_matte)
        total_mad += cal_mad(pd_matte, gt_matte)

        cnt += 1
    if cnt > 0:
        mse = total_mse / cnt
        mad = total_mad / cnt

    return mse, mad


if __name__ == '__main__':
    # create MODNet and load the pre-trained ckpt
    modnet = MODNet(backbone_pretrained=False)
    modnet = nn.DataParallel(modnet)

    ckp_pth = 'pretrained/modnet_photographic_portrait_matting.ckpt'
    if torch.cuda.is_available():
        modnet = modnet.cuda()
        weights = torch.load(ckp_pth)
    else:
        weights = torch.load(ckp_pth, map_location=torch.device('cpu'))
    modnet.load_state_dict(weights)

    dataset = load_eval_dataset('src/datasets/PPM-100')
    mse, mad = eval(modnet, dataset)
    print(f'mse: {mse:.6f}, mad: {mad:.6f}')
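A quick sanity check for cal_mad and cal_mse is to run them on tiny synthetic arrays whose expected values are easy to work out by hand. The snippet below is a minimal sketch that only assumes numpy and the two functions from the script above; the 2x2 matte values are made up for illustration.

import numpy as np

pred = np.array([[0.0, 0.5], [1.0, 1.0]])  # hypothetical predicted matte, values in [0, 1]
gt = np.array([[0.0, 1.0], [1.0, 0.5]])    # hypothetical ground-truth matte

print(cal_mad(pred, gt))  # mean(|pred - gt|)   = (0 + 0.5 + 0 + 0.5) / 4  = 0.25
print(cal_mse(pred, gt))  # mean((pred - gt)^2) = (0 + 0.25 + 0 + 0.25) / 4 = 0.125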
@@ -0,0 +1,85 @@
from src.models.modnet import MODNet
from PIL import Image
import numpy as np
from torchvision import transforms
import torch
import torch.nn.functional as F
import torch.nn as nn


def predit_matte(modnet: MODNet, im: Image.Image):
    # define image to tensor transform
    im_transform = transforms.Compose(
        [
            transforms.ToTensor(),
            transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
        ]
    )

    # define hyper-parameters
    ref_size = 512

    modnet.eval()

    # unify image channels to 3
    im = np.asarray(im)
    if len(im.shape) == 2:
        im = im[:, :, None]
    if im.shape[2] == 1:
        im = np.repeat(im, 3, axis=2)
    elif im.shape[2] == 4:
        im = im[:, :, 0:3]

    im = Image.fromarray(im)
    # convert image to PyTorch tensor
    im = im_transform(im)

    # add mini-batch dim
    im = im[None, :, :, :]

    # resize image for input: scale the shorter side to ref_size when needed,
    # then snap both sides down to multiples of 32
    im_b, im_c, im_h, im_w = im.shape
    if max(im_h, im_w) < ref_size or min(im_h, im_w) > ref_size:
        if im_w >= im_h:
            im_rh = ref_size
            im_rw = int(im_w / im_h * ref_size)
        elif im_w < im_h:
            im_rw = ref_size
            im_rh = int(im_h / im_w * ref_size)
    else:
        im_rh = im_h
        im_rw = im_w

    im_rw = im_rw - im_rw % 32
    im_rh = im_rh - im_rh % 32
    im = F.interpolate(im, size=(im_rh, im_rw), mode='area')

    # inference
    _, _, matte = modnet(im.cuda() if torch.cuda.is_available() else im, True)

    # resize the matte back to the original image size
    matte = F.interpolate(matte, size=(im_h, im_w), mode='area')
    matte = matte[0][0].data.cpu().numpy()
    return matte
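To make the resize step concrete: for a hypothetical 1920x1080 landscape photo (im_h=1080, im_w=1920), both sides exceed ref_size, so the shorter side is scaled to 512 and both sides are then snapped down to multiples of 32 before inference. The lines below only trace that arithmetic; the numbers are illustrative and not part of the script.

im_h, im_w, ref_size = 1080, 1920, 512   # illustrative input size
im_rh = ref_size                         # shorter side -> 512 (already a multiple of 32)
im_rw = int(im_w / im_h * ref_size)      # int(1920 / 1080 * 512) = 910
im_rw = im_rw - im_rw % 32               # 910 - 14 = 896
# the network therefore runs on a 512 x 896 tensor, and the matte is
# interpolated back to 1080 x 1920 at the end of predit_matte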
if __name__ == '__main__':
    # create MODNet and load the pre-trained ckpt
    modnet = MODNet(backbone_pretrained=False)
    modnet = nn.DataParallel(modnet)

    ckp_pth = 'pretrained/modnet_photographic_portrait_matting.ckpt'
    if torch.cuda.is_available():
        modnet = modnet.cuda()
        weights = torch.load(ckp_pth)
    else:
        weights = torch.load(ckp_pth, map_location=torch.device('cpu'))
    modnet.load_state_dict(weights)

    pth = 'src/datasets/PPM-100/image/13179159164_1a4ae8d085_o.jpg'
    img = Image.open(pth)

    matte = predit_matte(modnet, img)
    prd_img = Image.fromarray(((matte * 255).astype('uint8')), mode='L')
    prd_img.save('test_predic.jpg')
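Beyond saving the matte as a grayscale image, a common use of the predicted matte is alpha compositing the portrait onto a new background. The sketch below is illustrative only: it reuses modnet, img, and predit_matte from the block above, and the plain white background and the output name composite.png are arbitrary choices, not part of this commit.

# minimal compositing sketch (assumes modnet and img from the block above)
matte = predit_matte(modnet, img)            # (H, W) float matte in [0, 1]
fg = np.asarray(img).astype('float32')       # (H, W, 3) RGB foreground
alpha = matte[:, :, None]                    # add channel dim for broadcasting
bg = np.full_like(fg, 255.0)                 # plain white background
comp = alpha * fg + (1 - alpha) * bg         # standard alpha blend
Image.fromarray(comp.astype('uint8')).save('composite.png')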