Source code for tensorbay.opendataset.AnimalPose.loader

#!/usr/bin/env python3
#
# Copyright 2021 Graviti. Licensed under MIT License.
#
# pylint: disable=invalid-name
# pylint: disable=missing-module-docstring

import json
import os
from typing import Iterable, Iterator, List, Tuple

from ...dataset import Data, Dataset
from ...exception import ModuleImportError
from ...geometry import Keypoint2D
from ...label import LabeledBox2D, LabeledKeypoints2D
from .._utility import glob

DATASET_NAME_5 = "AnimalPose5"
DATASET_NAME_7 = "AnimalPose7"

_KEYPOINT_TO_INDEX = {
    "L_Eye": 0,
    "R_Eye": 1,
    "Nose": 4,
    "L_EarBase": 2,
    "R_EarBase": 3,
    "Throat": 5,
    "L_F_Elbow": 8,
    "R_F_Elbow": 9,
    "L_F_Paw": 16,
    "R_F_Paw": 17,
    "Withers": 7,
    "TailBase": 6,
    "L_B_Paw": 18,
    "R_B_Paw": 19,
    "L_B_Elbow": 10,
    "R_B_Elbow": 11,
    "L_F_Knee": 12,
    "R_F_Knee": 13,
    "L_B_Knee": 14,
    "R_B_Knee": 15,
}


[docs]def AnimalPose5(path: str) -> Dataset: """Dataloader of the `5 Categories Animal-Pose`_ dataset. .. _5 Categories Animal-Pose: https://sites.google.com/view/animal-pose/ The file structure should be like:: <path> keypoint_image_part1/ cat/ 2007_000549.jpg 2007_000876.jpg ... ... PASCAL2011_animal_annotation/ cat/ 2007_000549_1.xml 2007_000876_1.xml 2007_000876_2.xml ... ... animalpose_image_part2/ cat/ ca1.jpeg ca2.jpeg ... ... animalpose_anno2/ cat/ ca1.xml ca2.xml ... Arguments: path: The root directory of the dataset. Returns: Loaded :class:`~tensorbay.dataset.dataset.Dataset` instance. """ root_path = os.path.abspath(os.path.expanduser(path)) dataset = Dataset(DATASET_NAME_5) dataset.load_catalog(os.path.join(os.path.dirname(__file__), "catalog_5.json")) animals = dataset.catalog.keypoints2d.categories.keys() for segment_name, _get_data in _DATA_GETTERS.items(): segment = dataset.create_segment(segment_name) for data in _get_data(root_path, animals): segment.append(data) return dataset
def _get_data_part1(root_path: str, aniamls: Iterable[str]) -> Iterator[Data]: try: import xmltodict # pylint: disable=import-outside-toplevel except ModuleNotFoundError as error: raise ModuleImportError(module_name=error.name) from error for animal in aniamls: for image_path in glob(os.path.join(root_path, "keypoint_image_part1", animal, "*.jpg")): data = Data(image_path, target_remote_path=f"{animal}/{os.path.basename(image_path)}") for annotation_path in glob( os.path.join( root_path, "PASCAL2011_animal_annotation", animal, f"{os.path.splitext(os.path.basename(image_path))[0]}_*.xml", ) ): with open(annotation_path, encoding="utf-8") as fp: labels = xmltodict.parse(fp.read()) box2d = labels["annotation"]["visible_bounds"] data.label.box2d = [ LabeledBox2D.from_xywh( x=float(box2d["@xmin"]), y=float(box2d["@ymin"]), width=float(box2d["@width"]), height=float(box2d["@height"]), category=animal, ) ] keypoints2d: List[Tuple[float, float, int]] = [()] * 20 # type: ignore[list-item] for keypoint in labels["annotation"]["keypoints"]["keypoint"]: keypoints2d[_KEYPOINT_TO_INDEX[keypoint["@name"]]] = ( float(keypoint["@x"]), float(keypoint["@y"]), int(keypoint["@visible"]), ) data.label.keypoints2d = [LabeledKeypoints2D(keypoints2d, category=animal)] yield data def _get_data_part2(root_path: str, aniamls: Iterable[str]) -> Iterator[Data]: try: import xmltodict # pylint: disable=import-outside-toplevel except ModuleNotFoundError as error: raise ModuleImportError(module_name=error.name) from error for animal in aniamls: for image_path in glob(os.path.join(root_path, "animalpose_image_part2", animal, "*.jpeg")): data = Data(image_path, target_remote_path=f"{animal}/{os.path.basename(image_path)}") annotation_path = os.path.join( root_path, "animalpose_anno2", animal, f"{os.path.splitext(os.path.basename(image_path))[0]}.xml", ) with open(annotation_path, encoding="utf-8") as fp: labels = xmltodict.parse(fp.read()) box2d = labels["annotation"]["visible_bounds"] data.label.box2d = [ LabeledBox2D.from_xywh( x=float(box2d["@xmin"]), y=float(box2d["@xmax"]), # xmax means ymin in the annotation width=float(box2d["@width"]), height=float(box2d["@height"]), category=animal, ) ] keypoints2d = LabeledKeypoints2D(category=animal) for keypoint in labels["annotation"]["keypoints"]["keypoint"]: keypoints2d.append( # pylint: disable=no-member Keypoint2D( float(keypoint["@x"]), float(keypoint["@y"]), int(keypoint["@visible"]) ) ) data.label.keypoints2d = [keypoints2d] yield data _DATA_GETTERS = {"part1": _get_data_part1, "part2": _get_data_part2}
[docs]def AnimalPose7(path: str) -> Dataset: """Dataloader of `7 Categories Animal-Pose`_ dataset. .. _7 Categories Animal-Pose: https://sites.google.com/view/animal-pose/ The file structure should be like:: <path> bndbox_image/ antelope/ Img-77.jpg ... ... bndbox_anno/ antelope.json ... Arguments: path: The root directory of the dataset. Returns: loaded :class:`~tensorbay.dataset.dataset.Dataset` object. """ root_path = os.path.abspath(os.path.expanduser(path)) dataset = Dataset(DATASET_NAME_7) dataset.load_catalog(os.path.join(os.path.dirname(__file__), "catalog_7.json")) segment = dataset.create_segment() for animal in dataset.catalog.box2d.categories.keys(): with open(os.path.join(root_path, "bndbox_anno", f"{animal}.json"), encoding="utf-8") as fp: annotations = json.load(fp) for image_name, box2ds in annotations.items(): image_path = os.path.join(root_path, "bndbox_image", animal, image_name) data = Data(image_path, target_remote_path=f"{animal}/{image_name}") data.label.box2d = [] for box2d in box2ds: coordinates = box2d["bndbox"] data.label.box2d.append( LabeledBox2D( float(coordinates["xmin"]), float(coordinates["ymin"]), float(coordinates["xmax"]), float(coordinates["ymax"]), category=animal, ) ) segment.append(data) return dataset