mirror of
https://github.com/YaoFANGUK/video-subtitle-remover.git
synced 2026-02-26 21:54:41 +08:00
88 lines
3.0 KiB
Python
Executable File
88 lines
3.0 KiB
Python
Executable File
#!/usr/bin/env python3
|
|
|
|
import os
|
|
|
|
import numpy as np
|
|
import tqdm
|
|
from skimage import io
|
|
from skimage.segmentation import mark_boundaries
|
|
|
|
from saicinpainting.evaluation.data import InpaintingDataset
|
|
from saicinpainting.evaluation.vis import save_item_for_vis
|
|
|
|
def save_mask_for_sidebyside(item, out_file):
|
|
mask = item['mask']# > 0.5
|
|
if mask.ndim == 3:
|
|
mask = mask[0]
|
|
mask = np.clip(mask * 255, 0, 255).astype('uint8')
|
|
io.imsave(out_file, mask)
|
|
|
|
def save_img_for_sidebyside(item, out_file):
|
|
img = np.transpose(item['image'], (1, 2, 0))
|
|
img = np.clip(img * 255, 0, 255).astype('uint8')
|
|
io.imsave(out_file, img)
|
|
|
|
def save_masked_img_for_sidebyside(item, out_file):
|
|
mask = item['mask']
|
|
img = item['image']
|
|
|
|
img = (1-mask) * img + mask
|
|
img = np.transpose(img, (1, 2, 0))
|
|
|
|
img = np.clip(img * 255, 0, 255).astype('uint8')
|
|
io.imsave(out_file, img)
|
|
|
|
def main(args):
|
|
dataset = InpaintingDataset(args.datadir, img_suffix='.png')
|
|
|
|
area_bins = np.linspace(0, 1, args.area_bins + 1)
|
|
|
|
heights = []
|
|
widths = []
|
|
image_areas = []
|
|
hole_areas = []
|
|
hole_area_percents = []
|
|
area_bins_count = np.zeros(args.area_bins)
|
|
area_bin_titles = [f'{area_bins[i] * 100:.0f}-{area_bins[i + 1] * 100:.0f}' for i in range(args.area_bins)]
|
|
|
|
bin2i = [[] for _ in range(args.area_bins)]
|
|
|
|
for i, item in enumerate(tqdm.tqdm(dataset)):
|
|
h, w = item['image'].shape[1:]
|
|
heights.append(h)
|
|
widths.append(w)
|
|
full_area = h * w
|
|
image_areas.append(full_area)
|
|
hole_area = (item['mask'] == 1).sum()
|
|
hole_areas.append(hole_area)
|
|
hole_percent = hole_area / full_area
|
|
hole_area_percents.append(hole_percent)
|
|
bin_i = np.clip(np.searchsorted(area_bins, hole_percent) - 1, 0, len(area_bins_count) - 1)
|
|
area_bins_count[bin_i] += 1
|
|
bin2i[bin_i].append(i)
|
|
|
|
os.makedirs(args.outdir, exist_ok=True)
|
|
|
|
for bin_i in range(args.area_bins):
|
|
bindir = os.path.join(args.outdir, area_bin_titles[bin_i])
|
|
os.makedirs(bindir, exist_ok=True)
|
|
bin_idx = bin2i[bin_i]
|
|
for sample_i in np.random.choice(bin_idx, size=min(len(bin_idx), args.samples_n), replace=False):
|
|
item = dataset[sample_i]
|
|
path = os.path.join(bindir, dataset.img_filenames[sample_i].split('/')[-1])
|
|
save_masked_img_for_sidebyside(item, path)
|
|
|
|
|
|
if __name__ == '__main__':
|
|
import argparse
|
|
|
|
aparser = argparse.ArgumentParser()
|
|
aparser.add_argument('--datadir', type=str,
|
|
help='Path to folder with images and masks (output of gen_mask_dataset.py)')
|
|
aparser.add_argument('--outdir', type=str, help='Where to put results')
|
|
aparser.add_argument('--samples-n', type=int, default=10,
|
|
help='Number of sample images with masks to copy for visualization for each area bin')
|
|
aparser.add_argument('--area-bins', type=int, default=10, help='How many area bins to have')
|
|
|
|
main(aparser.parse_args())
|