-
Notifications
You must be signed in to change notification settings - Fork 4
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
feat(convert): add annotated_t4_to_deepen (#57)
* feat(convert): add annotated_t4_to_deepen Signed-off-by: kminoda <[email protected]> * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * fix: update default config Signed-off-by: kminoda <[email protected]> * fix: update default config Signed-off-by: kminoda <[email protected]> * feat: update readme Signed-off-by: kminoda <[email protected]> * fix: rename t4 to non_annotated_t4 Signed-off-by: kminoda <[email protected]> * fix: fix docs Signed-off-by: kminoda <[email protected]> * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * fix: change default label_only value Signed-off-by: kminoda <[email protected]> * Update docs/tools_overview.md Co-authored-by: Shunsuke Miura <[email protected]> --------- Signed-off-by: kminoda <[email protected]> Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Shunsuke Miura <[email protected]>
- Loading branch information
1 parent
df60a1c
commit 9c88581
Showing
7 changed files
with
315 additions
and
8 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,21 @@ | ||
task: convert_annotated_t4_to_deepen | ||
conversion: | ||
input_base: ./data/annotated_t4_format | ||
output_base: ./data/deepen_format | ||
annotation_hz: 10 | ||
workers_number: 12 | ||
label_only: False | ||
camera_sensors: | ||
- channel: CAM_FRONT | ||
- channel: CAM_FRONT_RIGHT | ||
- channel: CAM_BACK_RIGHT | ||
- channel: CAM_BACK | ||
- channel: CAM_BACK_LEFT | ||
- channel: CAM_FRONT_LEFT | ||
camera_position: | ||
CAM_FRONT: camera_0 | ||
CAM_FRONT_RIGHT: camera_1 | ||
CAM_BACK_RIGHT: camera_2 | ||
CAM_BACK: camera_3 | ||
CAM_BACK_LEFT: camera_4 | ||
CAM_FRONT_LEFT: camera_5 |
2 changes: 1 addition & 1 deletion
2
config/convert_t4_to_deepen_sample.yaml → ...rt_non_annotated_t4_to_deepen_sample.yaml
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
233 changes: 233 additions & 0 deletions
233
perception_dataset/deepen/annotated_t4_to_deepen_converter.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,233 @@ | ||
import glob | ||
import json | ||
import os | ||
import os.path as osp | ||
import time | ||
from typing import Any, Dict, List | ||
|
||
from nuimages import NuImages | ||
import numpy as np | ||
from nuscenes.nuscenes import NuScenes | ||
from nuscenes.utils.geometry_utils import transform_matrix | ||
from pyquaternion import Quaternion | ||
|
||
from perception_dataset.abstract_converter import AbstractConverter | ||
from perception_dataset.constants import LABEL_PATH_ENUM | ||
from perception_dataset.utils.label_converter import LabelConverter | ||
from perception_dataset.utils.logger import configure_logger | ||
|
||
logger = configure_logger(modname=__name__) | ||
|
||
|
||
class AnnotatedT4ToDeepenConverter(AbstractConverter): | ||
def __init__(self, input_base: str, output_base: str, camera_position: Dict): | ||
super().__init__(input_base, output_base) | ||
self._camera_position = camera_position | ||
self._label_converter = LabelConverter( | ||
label_path=LABEL_PATH_ENUM.OBJECT_LABEL, | ||
attribute_path=LABEL_PATH_ENUM.ATTRIBUTE, | ||
) | ||
|
||
def convert(self): | ||
start_time = time.time() | ||
|
||
for scene_dir in glob.glob(osp.join(self._input_base, "*")): | ||
if not osp.isdir(scene_dir): | ||
continue | ||
t4_dataset_path = osp.join(scene_dir, "t4_dataset") | ||
if not osp.isdir(t4_dataset_path): | ||
t4_dataset_path = scene_dir | ||
|
||
scene_name = osp.basename(scene_dir) | ||
self._convert_one_scene( | ||
t4_dataset_path, | ||
scene_name, | ||
) | ||
|
||
elapsed_time = time.time() - start_time | ||
logger.info(f"Elapsed time: {elapsed_time:.1f} [sec]") | ||
|
||
def _convert_one_scene(self, input_dir: str, scene_name: str): | ||
output_dir = self._output_base | ||
os.makedirs(output_dir, exist_ok=True) | ||
nusc = NuScenes(version="annotation", dataroot=input_dir, verbose=False) | ||
nuim = NuImages(version="annotation", dataroot=input_dir, verbose=True, lazy=True) | ||
|
||
logger.info(f"Converting {input_dir} to {output_dir}") | ||
output_label: List = [] | ||
|
||
for frame_index, sample_record in enumerate(nusc.sample): | ||
sample_token = sample_record["token"] | ||
logger.info(f"sample_token: {sample_token}") | ||
for anno_token in sample_record["anns"]: | ||
current_label_dict: Dict = {} | ||
current_label_dict["attributes_source"] = {} | ||
current_label_dict["create_time_millis"] = "null" | ||
current_label_dict["update_time_millis"] = "null" | ||
current_label_dict["dataset_id"] = "" | ||
current_label_dict["labeller_email"] = "[email protected]" | ||
current_label_dict["user_id"] = "[email protected]" | ||
current_label_dict["version"] = "null" | ||
current_label_dict["label_set_id"] = "default" | ||
current_label_dict["stage_id"] = "Labelling" | ||
anno = nusc.get("sample_annotation", anno_token) | ||
|
||
instance_record = nusc.get("instance", anno["instance_token"]) | ||
instance_index = nusc.getind("instance", anno["instance_token"]) + 1 | ||
category_record = nusc.get("category", instance_record["category_token"]) | ||
visibility_record = nusc.get("visibility", anno["visibility_token"]) | ||
|
||
for sensor, token in sample_record["data"].items(): | ||
if "LIDAR" in sensor: | ||
break | ||
|
||
sample_data_record = nusc.get("sample_data", sample_record["data"][sensor]) | ||
file_id = osp.basename(sample_data_record["filename"]).replace(".pcd.bin", ".pcd") | ||
label_category_id = self._label_converter.convert_label(category_record["name"]) | ||
|
||
attributes_records = [ | ||
nusc.get("attribute", token) for token in anno["attribute_tokens"] | ||
] | ||
attributes_name = [ | ||
self._label_converter.convert_attribute(v["name"]) for v in attributes_records | ||
] | ||
attributes = {v[0 : v.find(".")]: v[v.find(".") + 1 :] for v in attributes_name} | ||
if "occlusion_state" not in attributes: | ||
attributes["occlusion_state"] = self._convert_to_visibility_occulusion( | ||
visibility_record["level"] | ||
) | ||
|
||
three_d_bbox = { | ||
"cx": anno["translation"][0], | ||
"cy": anno["translation"][1], | ||
"cz": anno["translation"][2], | ||
"h": anno["size"][2], | ||
"l": anno["size"][1], | ||
"w": anno["size"][0], | ||
"quaternion": { | ||
"x": anno["rotation"][1], | ||
"y": anno["rotation"][2], | ||
"z": anno["rotation"][3], | ||
"w": anno["rotation"][0], | ||
}, | ||
} | ||
current_label_dict["three_d_bbox"] = three_d_bbox | ||
sensor_id = "lidar" | ||
label_type = "3d_bbox" | ||
|
||
current_label_dict["attributes"] = attributes | ||
current_label_dict["file_id"] = file_id | ||
current_label_dict["label_category_id"] = label_category_id | ||
current_label_dict["label_id"] = f"{label_category_id}:{instance_index}" | ||
current_label_dict["sensor_id"] = sensor_id | ||
current_label_dict["label_type"] = label_type | ||
|
||
output_label.append(current_label_dict) | ||
print(f"{label_category_id}:{instance_index}") | ||
|
||
if osp.exists(osp.join(input_dir, "annotation", "object_ann.json")): | ||
for frame_index, sample_record in enumerate(nusc.sample): | ||
for cam, sensor_id in self._camera_position.items(): | ||
if cam not in sample_record["data"]: | ||
continue | ||
sample_camera_token = sample_record["data"][cam] | ||
print(f"cam:{cam}, sample_camera_token: {sample_camera_token}") | ||
object_anns = [ | ||
o for o in nuim.object_ann if o["sample_data_token"] == sample_camera_token | ||
] | ||
|
||
for ann in object_anns: | ||
current_label_dict: Dict = {} | ||
category_token = ann["category_token"] | ||
category_record = nuim.get("category", category_token) | ||
bbox = ann["bbox"] | ||
bbox[2] = bbox[2] - bbox[0] | ||
bbox[3] = bbox[3] - bbox[1] | ||
label_type = "box" | ||
current_label_dict["box"] = bbox | ||
|
||
label_category_id = self._label_converter.convert_label( | ||
category_record["name"] | ||
) | ||
try: | ||
instance_index = nusc.getind("instance", ann["instance_token"]) + 1 | ||
attributes_records = [ | ||
nusc.get("attribute", token) for token in ann["attribute_tokens"] | ||
] | ||
attributes_name = [ | ||
self._label_converter.convert_attribute(v["name"]) | ||
for v in attributes_records | ||
] | ||
attributes = { | ||
v[0 : v.find(".")]: v[v.find(".") + 1 :] for v in attributes_name | ||
} | ||
|
||
current_label_dict["attributes"] = attributes | ||
current_label_dict["create_time_millis"] = "null" | ||
current_label_dict["update_time_millis"] = "null" | ||
current_label_dict["dataset_id"] = "" | ||
current_label_dict["labeller_email"] = "[email protected]" | ||
current_label_dict["user_id"] = "[email protected]" | ||
current_label_dict["version"] = "null" | ||
current_label_dict["label_set_id"] = "default" | ||
current_label_dict["stage_id"] = "Labelling" | ||
current_label_dict["file_id"] = f"{frame_index}.pcd" | ||
current_label_dict["label_category_id"] = label_category_id | ||
current_label_dict[ | ||
"label_id" | ||
] = f"{label_category_id}:{instance_index}" | ||
current_label_dict["sensor_id"] = sensor_id | ||
current_label_dict["label_type"] = label_type | ||
|
||
output_label.append(current_label_dict) | ||
print(f"{label_category_id}:{instance_index}") | ||
except KeyError: | ||
instance_id = ann["instance_token"] | ||
print(f"There is no instance_id:{instance_id}") | ||
|
||
output_json = {"labels": output_label} | ||
with open(osp.join(output_dir, f"{scene_name}.json"), "w") as f: | ||
json.dump(output_json, f, indent=4) | ||
|
||
logger.info(f"Done Conversion: {input_dir} to {output_dir}") | ||
|
||
def _get_data(self, nusc: NuScenes, sensor_channel_token: str) -> Dict[str, Any]: | ||
sd_record = nusc.get("sample_data", sensor_channel_token) | ||
cs_record = nusc.get("calibrated_sensor", sd_record["calibrated_sensor_token"]) | ||
ep_record = nusc.get("ego_pose", sd_record["ego_pose_token"]) | ||
|
||
sensor2ego_transform = transform_matrix( | ||
translation=cs_record["translation"], | ||
rotation=Quaternion(cs_record["rotation"]), | ||
) | ||
ego2global_transform = transform_matrix( | ||
translation=ep_record["translation"], | ||
rotation=Quaternion(ep_record["rotation"]), | ||
) | ||
|
||
sensor2global_transform = ego2global_transform @ sensor2ego_transform | ||
sensor2global_translation = sensor2global_transform[:3, 3] | ||
sensor2global_rotation = np.array(list(Quaternion(matrix=sensor2global_transform[:3, :3]))) | ||
|
||
ret_dict = { | ||
"fileformat": sd_record["fileformat"], | ||
"unix_timestamp": self._timestamp_to_sec(sd_record["timestamp"]), | ||
"sensor2global_transform": sensor2global_transform, | ||
"sensor2global_translation": sensor2global_translation, | ||
"sensor2global_rotation": sensor2global_rotation, | ||
} | ||
|
||
return ret_dict | ||
|
||
def _timestamp_to_sec(self, timestamp: int) -> float: | ||
return float(timestamp) * 1e-6 | ||
|
||
def _convert_to_visibility_occulusion(self, name: str) -> str: | ||
if name == "none": | ||
return "full" | ||
elif name == "most": | ||
return "partial" | ||
elif name == "partial": | ||
return "most" | ||
else: | ||
return "none" |
2 changes: 1 addition & 1 deletion
2
tests/config/convert_t4_to_deepen.yaml → ...g/convert_non_annotated_t4_to_deepen.yaml
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters