Skip to content

Commit

Permalink
[datasets] revert whitespace filtering and fix svhn reco (#987)
Browse files Browse the repository at this point in the history
  • Loading branch information
felixdittrich92 committed Jul 20, 2022
1 parent bb24e3f commit 739943a
Show file tree
Hide file tree
Showing 6 changed files with 9 additions and 10 deletions.
4 changes: 2 additions & 2 deletions .github/workflows/references.yml
Original file line number Diff line number Diff line change
Expand Up @@ -153,10 +153,10 @@ jobs:
pip install -e .[torch] --upgrade
- if: matrix.framework == 'tensorflow'
name: Evaluate text recognition (TF)
run: python references/recognition/evaluate_tensorflow.py crnn_mobilenet_v3_small --dataset IIIT5K
run: python references/recognition/evaluate_tensorflow.py crnn_mobilenet_v3_small --dataset IIIT5K -b 32
- if: matrix.framework == 'pytorch'
name: Evaluate text recognition (PT)
run: python references/recognition/evaluate_pytorch.py crnn_mobilenet_v3_small --dataset IIIT5K
run: python references/recognition/evaluate_pytorch.py crnn_mobilenet_v3_small --dataset IIIT5K -b 32

latency-text-recognition:
runs-on: ${{ matrix.os }}
Expand Down
4 changes: 1 addition & 3 deletions doctr/datasets/cord.py
Original file line number Diff line number Diff line change
Expand Up @@ -97,9 +97,7 @@ def __init__(
crops = crop_bboxes_from_image(img_path=os.path.join(tmp_root, img_path),
geoms=np.asarray(box_targets, dtype=int).clip(min=0))
for crop, label in zip(crops, list(text_targets)):
# filter labels with whitespaces
if ' ' not in label:
self.data.append((crop, dict(labels=[label])))
self.data.append((crop, dict(labels=[label])))
else:
self.data.append((
img_path,
Expand Down
4 changes: 2 additions & 2 deletions doctr/datasets/funsd.py
Original file line number Diff line number Diff line change
Expand Up @@ -91,8 +91,8 @@ def __init__(
crops = crop_bboxes_from_image(img_path=os.path.join(tmp_root, img_path),
geoms=np.asarray(box_targets, dtype=np_dtype))
for crop, label in zip(crops, list(text_targets)):
# filter labels with non utf-8 characters and whitespaces
if not any(char in label for char in [' ', '☑', '☐', '\uf703', '\uf702']):
# filter labels with unknown characters
if not any(char in label for char in ['☑', '☐', '\uf703', '\uf702']):
self.data.append((crop, dict(labels=[label])))
else:
self.data.append((
Expand Down
3 changes: 2 additions & 1 deletion doctr/datasets/svhn.py
Original file line number Diff line number Diff line change
Expand Up @@ -114,7 +114,8 @@ def __init__(
if recognition_task:
crops = crop_bboxes_from_image(img_path=os.path.join(tmp_root, img_name), geoms=box_targets)
for crop, label in zip(crops, label_targets):
self.data.append((crop, dict(labels=[label])))
if crop.shape[0] > 0 and crop.shape[1] > 0 and len(label) > 0:
self.data.append((crop, dict(labels=[label])))
else:
self.data.append((img_name, dict(boxes=box_targets, labels=label_targets)))

Expand Down
2 changes: 1 addition & 1 deletion references/recognition/evaluate_pytorch.py
Original file line number Diff line number Diff line change
Expand Up @@ -146,7 +146,7 @@ def parse_args():
parser.add_argument('--vocab', type=str, default="french", help='Vocab to be used for evaluation')
parser.add_argument('--dataset', type=str, default="FUNSD", help='Dataset to evaluate on')
parser.add_argument('--device', default=None, type=int, help='device')
parser.add_argument('-b', '--batch_size', type=int, default=32, help='batch size for evaluation')
parser.add_argument('-b', '--batch_size', type=int, default=1, help='batch size for evaluation')
parser.add_argument('--input_size', type=int, default=32, help='input size H for the model, W = 4*H')
parser.add_argument('-j', '--workers', type=int, default=None, help='number of workers used for dataloading')
parser.add_argument('--only_regular', dest='regular', action='store_true',
Expand Down
2 changes: 1 addition & 1 deletion references/recognition/evaluate_tensorflow.py
Original file line number Diff line number Diff line change
Expand Up @@ -124,7 +124,7 @@ def parse_args():
parser.add_argument('arch', type=str, help='text-recognition model to evaluate')
parser.add_argument('--vocab', type=str, default="french", help='Vocab to be used for evaluation')
parser.add_argument('--dataset', type=str, default="FUNSD", help='Dataset to evaluate on')
parser.add_argument('-b', '--batch_size', type=int, default=32, help='batch size for evaluation')
parser.add_argument('-b', '--batch_size', type=int, default=1, help='batch size for evaluation')
parser.add_argument('--input_size', type=int, default=32, help='input size H for the model, W = 4*H')
parser.add_argument('-j', '--workers', type=int, default=None, help='number of workers used for dataloading')
parser.add_argument('--only_regular', dest='regular', action='store_true',
Expand Down

0 comments on commit 739943a

Please sign in to comment.