Skip to content

Commit

Permalink
Updates
Browse files Browse the repository at this point in the history
  • Loading branch information
SeguinBe committed Apr 3, 2018
1 parent ecfaa98 commit 2359a92
Show file tree
Hide file tree
Showing 11 changed files with 192 additions and 30 deletions.
16 changes: 14 additions & 2 deletions configs/cBAD/cbad_post_processing_configs.json
Original file line number Diff line number Diff line change
@@ -1,7 +1,19 @@
{
"configs":[
{"low_threshold": 0.25, "high_threshold": 0.6},
{"low_threshold": 0.1, "high_threshold": 0.3},
{"low_threshold": 0.3, "high_threshold": 0.7}
{"low_threshold": 0.2, "high_threshold": 0.3},
{"low_threshold": 0.2, "high_threshold": 0.4},
{"low_threshold": 0.3, "high_threshold": 0.4},
{"low_threshold": 0.3, "high_threshold": 0.5},
{"low_threshold": 0.1, "high_threshold": 0.3, "sigma": 1.5},
{"low_threshold": 0.2, "high_threshold": 0.3, "sigma": 1.5},
{"low_threshold": 0.2, "high_threshold": 0.4, "sigma": 1.5},
{"low_threshold": 0.3, "high_threshold": 0.4, "sigma": 1.5},
{"low_threshold": 0.3, "high_threshold": 0.5, "sigma": 1.5},
{"low_threshold": 0.1, "high_threshold": 0.3, "sigma": 2.5},
{"low_threshold": 0.2, "high_threshold": 0.3, "sigma": 2.5},
{"low_threshold": 0.2, "high_threshold": 0.4, "sigma": 2.5},
{"low_threshold": 0.3, "high_threshold": 0.4, "sigma": 2.5},
{"low_threshold": 0.3, "high_threshold": 0.5, "sigma": 2.5}
]
}
12 changes: 12 additions & 0 deletions doc_seg/post_processing/PAGE.py
Original file line number Diff line number Diff line change
Expand Up @@ -273,6 +273,18 @@ def draw_baselines(self, img_canvas, color=(255, 0, 0), thickness=2, endpoint_ra
cv2.circle(img_canvas, (coords[-1, 0, 0], coords[-1, 0, 1]),
radius=endpoint_radius, color=color, thickness=-1)

def draw_textregions(self, img_canvas, color=(255, 0, 0), autoscale=True):
if autoscale:
assert self.image_height is not None
assert self.image_width is not None
ratio = (img_canvas.shape[0]/self.image_height, img_canvas.shape[1]/self.image_width)
else:
ratio = (1, 1)

tr_coords = [(Point.list_to_cv2poly(tr.coords)*ratio).astype(np.int32) for tr in self.text_regions
if len(tr.coords) > 0]
cv2.fillPoly(img_canvas, tr_coords, color)


def parse_file(filename: str) -> Page:
xml_page = ET.parse(filename)
Expand Down
2 changes: 1 addition & 1 deletion doc_seg/post_processing/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@

from .segmentation import dibco_binarization_fn, diva_post_processing_fn, page_post_processing_fn
from .segmentation import dibco_binarization_fn
from .line_detection import cbad_post_processing_fn
from .boxes_detection import cini_post_processing_fn, ornaments_post_processing_fn
34 changes: 20 additions & 14 deletions doc_seg/post_processing/line_detection.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@


def cbad_post_processing_fn(probs: np.array, sigma: float=2.5, low_threshold: float=0.8, high_threshold: float=0.9,
output_basename=None):
filter_width: float=0, output_basename=None):
"""
:param probs: output of the model (probabilities) in range [0, 255]
Expand All @@ -28,7 +28,7 @@ def cbad_post_processing_fn(probs: np.array, sigma: float=2.5, low_threshold: fl
WARNING : contours IN OPENCV format List[np.ndarray(n_points, 1, (x,y))]
"""

contours, lines_mask = line_extraction_v1(probs[:, :, 1], sigma, low_threshold, high_threshold)
contours, lines_mask = line_extraction_v1(probs[:, :, 1], sigma, low_threshold, high_threshold, filter_width)
if output_basename is not None:
dump_pickle(output_basename+'.pkl', (contours, lines_mask.shape))
return contours, lines_mask
Expand All @@ -47,25 +47,29 @@ def line_extraction_v0(probs, sigma, threshold):
return contours, lines_mask


def line_extraction_v1(probs, sigma, low_threshold, high_threshold):
# probs_line = probs[:, :, 1]
def line_extraction_v1(probs, low_threshold, high_threshold, sigma=0.0, filter_width=0.00, vertical_maxima=True):
probs_line = probs
# Smooth
probs2 = cv2.GaussianBlur(probs_line, (int(3*sigma)*2+1, int(3*sigma)*2+1), sigma)
local_maxima = vertical_local_maxima(probs2)
lines_mask = hysteresis_thresholding(probs2, local_maxima, low_threshold, high_threshold)
# Remove lines touching border
if sigma > 0.:
probs2 = cv2.GaussianBlur(probs_line, (int(3*sigma)*2+1, int(3*sigma)*2+1), sigma)
else:
probs2 = cv2.fastNlMeansDenoising((probs_line*255).astype(np.uint8), h=50)/255
#probs2 = probs_line
#local_maxima = vertical_local_maxima(probs2)
lines_mask = hysteresis_thresholding(probs2, low_threshold, high_threshold,
candidates=vertical_local_maxima(probs2) if vertical_maxima else None)
#lines_mask = remove_borders(lines_mask)
# Extract polygons from line mask
contours = extract_line_polygons(lines_mask)

filtered_contours = []
page_width = probs.shape[1]
for cnt in contours:
if cv2.arcLength(cnt, False) < 0.05*page_width:
continue
if cv2.arcLength(cnt, False) < 0.05*page_width:
centroid_x, centroid_y = np.mean(cnt, axis=0)[0]
if centroid_x < filter_width*page_width or centroid_x > (1-filter_width)*page_width:
continue
# if cv2.arcLength(cnt, False) < filter_width*page_width:
# continue
filtered_contours.append(cnt)

return filtered_contours, lines_mask
Expand Down Expand Up @@ -153,12 +157,14 @@ def goal_reached(self, int_index, float_cumcost):

def vertical_local_maxima(probs):
local_maxima = np.zeros_like(probs, dtype=bool)
local_maxima[1:-1] = (probs[1:-1] > probs[:-2]) & (probs[2:] < probs[1:-1])
local_maxima[1:-1] = (probs[1:-1] >= probs[:-2]) & (probs[2:] <= probs[1:-1])
return local_maxima


def hysteresis_thresholding(probs: np.array, candidates: np.array, low_threshold: float, high_threshold: float):
low_mask = candidates & (probs > low_threshold)
def hysteresis_thresholding(probs: np.array, low_threshold: float, high_threshold: float, candidates=None):
low_mask = probs > low_threshold
if candidates is not None:
low_mask = candidates & low_mask
# Connected components extraction
label_components, count = label(low_mask, np.ones((3, 3)))
# Keep components with high threshold elements
Expand Down
2 changes: 1 addition & 1 deletion exps/Cini/cini_evaluation.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@
from scipy.misc import imread, imsave, imresize
import cv2
import numpy as np
from .cini_post_processing import cini_post_processing_fn
from cini_post_processing import cini_post_processing_fn
from doc_seg.utils import load_pickle
import pandas as pd

Expand Down
125 changes: 125 additions & 0 deletions exps/Cini/cini_process_set.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,125 @@
#!/usr/bin/env python
__author__ = 'solivr'

import os
import sys

sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), os.path.pardir, os.path.pardir)))
from doc_seg.loader import LoadedModel
from cini_post_processing import cini_post_processing_fn
from cini_evaluation import cini_evaluate_folder

import tensorflow as tf
from tqdm import tqdm
import numpy as np
import argparse
from glob import glob
from scipy.misc import imread, imresize, imsave
import tempfile
import json
from doc_seg.post_processing import PAGE
from doc_seg.utils import hash_dict, dump_json


def predict_on_set(filenames_to_predict, model_dir, output_dir):
"""
:param filenames_to_predict:
:param model_dir:
:param output_dir:
:return:
"""
with tf.Session():
m = LoadedModel(model_dir, 'filename')
for filename in tqdm(filenames_to_predict, desc='Prediction'):
pred = m.predict(filename)['probs'][0]
np.save(os.path.join(output_dir, os.path.basename(filename).split('.')[0]),
np.uint8(255 * pred))


def find_elements(img_filenames, dir_predictions, post_process_params, output_dir, debug=False, mask_dir: str=None):
"""
:param img_filenames:
:param dir_predictions:
:param post_process_params:
:param output_dir:
:return:
"""

os.makedirs(output_dir, exist_ok=True)

for filename in tqdm(img_filenames, 'Post-processing'):
orig_img = imread(filename, mode='RGB')
basename = os.path.basename(filename).split('.')[0]

filename_pred = os.path.join(dir_predictions, basename + '.npy')
pred = np.load(filename_pred)/255 # type: np.ndarray

contours, lines_mask = cini_post_processing_fn(pred, **post_process_params,
output_basename=os.path.join(output_dir, basename))


if __name__ == '__main__':
parser = argparse.ArgumentParser()
parser.add_argument('-m', '--model-dir', type=str, required=True,
help='Directory of the model (should be of type ''*/export/<timestamp>)')
parser.add_argument('-i', '--input-files', type=str, required=True, nargs='+',
help='Folder containing the images to evaluate the model on')
parser.add_argument('-o', '--output-dir', type=str, required=True,
help='Folder containing the outputs (.npy predictions and visualization errors)')
parser.add_argument('-gt', '--ground_truth_dir', type=str, required=True,
help='Ground truth directory containing the labeled images')
parser.add_argument('--params-file', type=str, default=None,
help='JSOn file containing the params for post-processing')
parser.add_argument('--gpu', type=str, default='0', help='Which GPU to use')
parser.add_argument('-pp', '--post-process-only', default=False, action='store_true',
help='Whether to make or not the prediction')
args = parser.parse_args()
args = vars(args)

os.environ["CUDA_VISIBLE_DEVICES"] = args.get('gpu')
model_dir = args.get('model_dir')
input_files = args.get('input_files')
if len(input_files) == 0:
raise FileNotFoundError

output_dir = args.get('output_dir')
os.makedirs(output_dir, exist_ok=True)

# Prediction
npy_directory = output_dir
if not args.get('post_process_only'):
predict_on_set(input_files, model_dir, npy_directory)

npy_files = glob(os.path.join(npy_directory, '*.npy'))

if args.get('params_file') is None:
print('No params file found')
params_list = [{"clean_predictions": True, "advanced": True}]
else:
with open(args.get('params_file'), 'r') as f:
configs_data = json.load(f)
# If the file contains a list of configurations
if 'configs' in configs_data.keys():
params_list = configs_data['configs']
assert isinstance(params_list, list)
# Or if there is a single configuration
else:
params_list = [configs_data]

gt_dir = args.get('ground_truth_dir')

for params in tqdm(params_list, desc='Params'):
print(params)
exp_dir = os.path.join(output_dir, '_' + hash_dict(params))
find_elements(input_files, npy_directory, params, exp_dir, debug=False)

if gt_dir is not None:
scores = cini_evaluate_folder(exp_dir, gt_dir, debug_folder=os.path.join(exp_dir, '_debug'))
dump_json(os.path.join(exp_dir, 'post_process_config.json'), params)
dump_json(os.path.join(exp_dir, 'scores.json'), scores)
print('Scores : {}'.format(scores))



2 changes: 1 addition & 1 deletion exps/DIVA/diva_evaluation.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@
import numpy as np
import cv2
import json
from diva_dataset_generator import MAP_COLORS
from .diva_dataset_generator import MAP_COLORS


DIVA_CLASSES = {
Expand Down
4 changes: 2 additions & 2 deletions exps/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,9 +3,9 @@
from .Page.page_post_processing import page_post_processing_fn
from .cBAD.cbad_post_processing import cbad_post_processing_fn
from .DIBCO.dibco_post_processing import dibco_binarization_fn
from .Cini.cini_post_processing import cini_post_processing_fn
#from .Cini.cini_post_processing import cini_post_processing_fn
from .DIVA.diva_evaluation import diva_evaluate_folder
from .Cini.cini_evaluation import cini_evaluate_folder
#from .Cini.cini_evaluation import cini_evaluate_folder
from .cBAD.cbad_evaluation import cbad_evaluate_folder
from .DIBCO.dibco_evaluation import dibco_evaluate_folder
from .Ornaments.ornaments_evaluation import ornament_evaluate_folder
Expand Down
12 changes: 7 additions & 5 deletions exps/cBAD/cbad_post_processing.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,16 +47,17 @@ def line_extraction_v0(probs, sigma, threshold):
return contours, lines_mask


def line_extraction_v1(probs, low_threshold, high_threshold, sigma=0.0, filter_width=0.00):
def line_extraction_v1(probs, low_threshold, high_threshold, sigma=0.0, filter_width=0.00, vertical_maxima=False):
probs_line = probs
# Smooth
if sigma > 0.:
probs2 = cv2.GaussianBlur(probs_line, (int(3*sigma)*2+1, int(3*sigma)*2+1), sigma)
else:
probs2 = cv2.fastNlMeansDenoising((probs_line*255).astype(np.uint8), h=50)/255
probs2 = cv2.fastNlMeansDenoising((probs_line*255).astype(np.uint8), h=20)/255
#probs2 = probs_line
#local_maxima = vertical_local_maxima(probs2)
lines_mask = hysteresis_thresholding(probs2, low_threshold, high_threshold)
lines_mask = hysteresis_thresholding(probs2, low_threshold, high_threshold,
candidates=vertical_local_maxima(probs2) if vertical_maxima else None)
# Remove lines touching border
#lines_mask = remove_borders(lines_mask)
# Extract polygons from line mask
Expand Down Expand Up @@ -157,8 +158,9 @@ def goal_reached(self, int_index, float_cumcost):

def vertical_local_maxima(probs):
local_maxima = np.zeros_like(probs, dtype=bool)
local_maxima[1:-1] = (probs[1:-1] > probs[:-2]) & (probs[2:] < probs[1:-1])
return local_maxima
local_maxima[1:-1] = (probs[1:-1] => probs[:-2]) & (probs[2:] <= probs[1:-1])
local_maxima = cv2.morphologyEx(local_maxima.astype(np.uint8), cv2.MORPH_CLOSE, np.ones((5, 5), dtype=np.uint8))
return local_maxima > 0


def hysteresis_thresholding(probs: np.array, low_threshold: float, high_threshold: float, candidates=None):
Expand Down
4 changes: 2 additions & 2 deletions model_selection.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,7 +55,7 @@

# Perform test prediction (is it the right place?)
test_folder = args.get('test_folder')
for i, best_experiment in enumerate(sorted_experiments[:1]):
for i, best_experiment in enumerate(sorted_experiments[:10]):
print(best_experiment)
print('Validation :')
print(best_experiment.get_best_validated_epoch())
Expand All @@ -68,7 +68,7 @@
if len(test_files) == 0:
print('No files in ', test_folder)
continue
if args.get('eval_only'):
if not args.get('eval_only'):
with tf.Graph().as_default(), tf.Session() as sess:
m = LoadedModel(model_folder, input_dict_key='filename')
for filename in tqdm(test_files, desc='Test images'):
Expand Down
9 changes: 7 additions & 2 deletions scripts/cBAD/cbad_process_set.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ def predict_on_set(filenames_to_predict, model_dir, output_dir):
np.uint8(255 * pred))


def find_lines(img_filenames, dir_predictions, post_process_params, output_dir, debug=False):
def find_lines(img_filenames, dir_predictions, post_process_params, output_dir, debug=False, mask_dir: str=None):
"""
:param img_filenames:
Expand All @@ -51,8 +51,13 @@ def find_lines(img_filenames, dir_predictions, post_process_params, output_dir,

filename_pred = os.path.join(dir_predictions, basename + '.npy')
pred = np.load(filename_pred)
lines_prob = pred[:, :, 1]

contours, lines_mask = line_extraction_v1(pred[:, :, 1], **post_process_params)
if mask_dir is not None:
mask = imread(os.path.join(mask_dir, basename + '_bin.png'), mode='L')
lines_prob[mask == 0] = 0.

contours, lines_mask = line_extraction_v1(lines_prob, **post_process_params)
if debug:
imsave(os.path.join(output_dir, '{}_bin.jpg'.format(basename)), lines_mask)

Expand Down

0 comments on commit 2359a92

Please sign in to comment.