File size: 3,226 Bytes
24eb05d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#!/usr/bin/env python3
import glob
import logging
import os
import shutil
import sys
import traceback

from saicinpainting.evaluation.data import load_image
from saicinpainting.evaluation.utils import move_to_device

os.environ['OMP_NUM_THREADS'] = '1'
os.environ['OPENBLAS_NUM_THREADS'] = '1'
os.environ['MKL_NUM_THREADS'] = '1'
os.environ['VECLIB_MAXIMUM_THREADS'] = '1'
os.environ['NUMEXPR_NUM_THREADS'] = '1'

import cv2
import hydra
import numpy as np
import torch
import tqdm
import yaml
from omegaconf import OmegaConf
from torch.utils.data._utils.collate import default_collate

from saicinpainting.training.data.datasets import make_default_val_dataset
from saicinpainting.training.trainers import load_checkpoint
from saicinpainting.utils import register_debug_signal_handlers

LOGGER = logging.getLogger(__name__)


def main(args):
    try:
        if not args.indir.endswith('/'):
            args.indir += '/'

        for in_img in glob.glob(os.path.join(args.indir, '**', '*' + args.img_suffix), recursive=True):
            if 'mask' in os.path.basename(in_img):
                continue

            out_img_path = os.path.join(args.outdir, os.path.splitext(in_img[len(args.indir):])[0] + '.png')
            out_mask_path = f'{os.path.splitext(out_img_path)[0]}_mask.png'

            os.makedirs(os.path.dirname(out_img_path), exist_ok=True)

            img = load_image(in_img)
            height, width = img.shape[1:]
            pad_h, pad_w = int(height * args.coef / 2), int(width * args.coef / 2)

            mask = np.zeros((height, width), dtype='uint8')

            if args.expand:
                img = np.pad(img, ((0, 0), (pad_h, pad_h), (pad_w, pad_w)))
                mask = np.pad(mask, ((pad_h, pad_h), (pad_w, pad_w)), mode='constant', constant_values=255)
            else:
                mask[:pad_h] = 255
                mask[-pad_h:] = 255
                mask[:, :pad_w] = 255
                mask[:, -pad_w:] = 255

            # img = np.pad(img, ((0, 0), (pad_h * 2, pad_h * 2), (pad_w * 2, pad_w * 2)), mode='symmetric')
            # mask = np.pad(mask, ((pad_h * 2, pad_h * 2), (pad_w * 2, pad_w * 2)), mode = 'symmetric')

            img = np.clip(np.transpose(img, (1, 2, 0)) * 255, 0, 255).astype('uint8')
            img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
            cv2.imwrite(out_img_path, img)

            cv2.imwrite(out_mask_path, mask)
    except KeyboardInterrupt:
        LOGGER.warning('Interrupted by user')
    except Exception as ex:
        LOGGER.critical(f'Prediction failed due to {ex}:\n{traceback.format_exc()}')
        sys.exit(1)


if __name__ == '__main__':
    import argparse

    aparser = argparse.ArgumentParser()
    aparser.add_argument('indir', type=str, help='Root directory with images')
    aparser.add_argument('outdir', type=str, help='Where to store results')
    aparser.add_argument('--img-suffix', type=str, default='.png', help='Input image extension')
    aparser.add_argument('--expand', action='store_true', help='Generate mask by padding (true) or by cropping (false)')
    aparser.add_argument('--coef', type=float, default=0.2, help='How much to crop/expand in order to get masks')

    main(aparser.parse_args())