Skip to content

Commit

Permalink
fix: update conversion
Browse files Browse the repository at this point in the history
Signed-off-by: ktro2828 <[email protected]>
  • Loading branch information
ktro2828 committed Nov 27, 2024
1 parent 650bdf3 commit d96f426
Show file tree
Hide file tree
Showing 21 changed files with 528 additions and 50 deletions.
8 changes: 3 additions & 5 deletions config/update_t4_with_fastlabel_sample.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,11 +14,9 @@ description:
CAM_FRONT_LEFT: 5

conversion:
input_base: ./data/input/t4_format_2d_annotated # could be non_annotated_t4_format or t4_format_3d_annotated
input_base: ./data/input_t4_format # could be non_annotated_t4_format or t4_format_3d_annotated
input_anno_base: ./data/fastlabel
input_bag_base: ./data/rosbag2
output_base: ./data/output/t4_format_2d_annotated # this only includes the 2D annotations
topic_list: ./config/topic_list_sample.yaml
output_base: ./data/output_t4_format # currently, this only includes the 2D annotations
dataset_corresponding:
# input t4dataset_name: FastLabel json file name
DBv2.0-2-4: 2-4.json
T4DatasetName: FastLabelAnnotationFile
6 changes: 0 additions & 6 deletions perception_dataset/convert.py
Original file line number Diff line number Diff line change
Expand Up @@ -380,10 +380,6 @@ def main():
input_anno_base = config_dict["conversion"]["input_anno_base"]
dataset_corresponding = config_dict["conversion"]["dataset_corresponding"]
description = config_dict["description"]
input_bag_base = config_dict["conversion"]["input_bag_base"]
topic_list_yaml_path = config_dict["conversion"]["topic_list"]
with open(topic_list_yaml_path) as f:
topic_list_yaml = yaml.safe_load(f)

converter = FastLabel2dToUpdater(
input_base=input_base,
Expand All @@ -392,8 +388,6 @@ def main():
dataset_corresponding=dataset_corresponding,
overwrite_mode=args.overwrite,
description=description,
input_bag_base=input_bag_base,
topic_list=topic_list_yaml,
)
logger.info(
f"[BEGIN] Updating T4 dataset ({input_base}) with FastLabel {input_anno_base} into T4 data ({output_base})"
Expand Down
28 changes: 22 additions & 6 deletions perception_dataset/fastlabel_to_t4/fastlabel_2d_to_t4_updater.py
Original file line number Diff line number Diff line change
@@ -1,9 +1,10 @@
from __future__ import annotations

import json
import os.path as osp
from pathlib import Path
import shutil
from typing import Dict, List
from typing import Dict

from perception_dataset.fastlabel_to_t4.fastlabel_2d_to_t4_converter import (
FastLabel2dToT4Converter,
Expand All @@ -23,8 +24,6 @@ def __init__(
dataset_corresponding: Dict[str, int],
overwrite_mode: bool,
description: Dict[str, Dict[str, str]],
input_bag_base: str | None,
topic_list: Dict[str, List[str]] | List[str],
):
super().__init__(
input_base,
Expand All @@ -33,13 +32,13 @@ def __init__(
dataset_corresponding,
overwrite_mode,
description,
input_bag_base,
topic_list,
input_bag_base=None,
topic_list=None,
)

def convert(self) -> None:
anno_jsons_dict = self._load_annotation_jsons()
fl_annotations = self._format_deepen_annotation(anno_jsons_dict)
fl_annotations = self._format_fastlabel_annotation(anno_jsons_dict)

for t4dataset_name in self._t4dataset_name_to_merge:
# Check if input directory exists
Expand All @@ -53,9 +52,13 @@ def convert(self) -> None:
output_dir = self._output_base / t4dataset_name / "t4_dataset"
if self._input_bag_base is not None:
input_bag_dir = Path(self._input_bag_base) / t4dataset_name

if osp.exists(output_dir):
logger.error(f"{output_dir} already exists.")
is_dir_exist = True
else:
is_dir_exist = False

if self._overwrite_mode or not is_dir_exist:
# Remove existing output directory
shutil.rmtree(output_dir, ignore_errors=True)
Expand All @@ -78,3 +81,16 @@ def convert(self) -> None:
scene_anno_dict=fl_annotations[t4dataset_name],
dataset_name=t4dataset_name,
)

def _load_annotation_jsons(self):
anno_dict = {}
for file in self._input_anno_files:
t4_dataset_name = None
for name, ann_filename in self._t4dataset_name_to_merge.items():
if ann_filename == file.name:
t4_dataset_name = name

assert t4_dataset_name is not None
with open(file) as f:
anno_dict[t4_dataset_name] = json.load(f)
return anno_dict
82 changes: 69 additions & 13 deletions perception_dataset/t4_dataset/annotation_files_updater.py
Original file line number Diff line number Diff line change
@@ -1,10 +1,30 @@
import json
import os.path as osp
from typing import Any
from typing import Any, Dict

from perception_dataset.t4_dataset.annotation_files_generator import AnnotationFilesGenerator
from perception_dataset.t4_dataset.classes import (
AttributeTable,
CategoryTable,
InstanceTable,
ObjectAnnTable,
SampleAnnotationTable,
SurfaceAnnTable,
VisibilityTable,
)


def _load_json(filepath: str) -> Any:
with open(filepath) as f:
data = json.load(f)
return data


class AnnotationFilesUpdater(AnnotationFilesGenerator):
def __init__(self, with_camera: bool = True, description: Dict[str, Dict[str, str]] = ...):
super().__init__(with_camera, description)
self.description = description

def convert_one_scene(
self,
input_dir: str,
Expand All @@ -17,22 +37,58 @@ def convert_one_scene(
raise ValueError(f"Annotations files doesn't exist in {anno_dir}")

# Load existence annotation files
self._attribute_table.insert_from_json(osp.join(anno_dir, self._attribute_table.FILENAME))
self._category_table.insert_from_json(osp.join(anno_dir, self._category_table.FILENAME))
self._instance_table.insert_from_json(osp.join(anno_dir, self._instance_table.FILENAME))
self._sample_annotation_table.insert_from_json(
osp.join(anno_dir, self._sample_annotation_table.FILENAME)
)
self._object_ann_table.insert_from_json(
osp.join(anno_dir, self._object_ann_table.FILENAME)
)
self._surface_ann_table.insert_from_json(
osp.join(anno_dir, self._surface_ann_table.FILENAME)
)
self._init_table_from_json(anno_dir=anno_dir)

super().convert_one_scene(
input_dir=input_dir,
output_dir=output_dir,
scene_anno_dict=scene_anno_dict,
dataset_name=dataset_name,
)

def _init_table_from_json(self, anno_dir: str) -> None:
self._attribute_table = AttributeTable.from_json(
filepath=osp.join(anno_dir, AttributeTable.FILENAME),
name_to_description={},
default_value="",
)

self._category_table = CategoryTable.from_json(
filepath=osp.join(anno_dir, CategoryTable.FILENAME),
name_to_description={},
default_value="",
)

self._instance_table = InstanceTable.from_json(
filepath=osp.join(anno_dir, InstanceTable.FILENAME)
)

self._visibility_table = VisibilityTable.from_json(
filepath=osp.join(anno_dir, VisibilityTable.FILENAME),
level_to_description=self.description.get(
"visibility",
{
"v0-40": "visibility of whole object is between 0 and 40%",
"v40-60": "visibility of whole object is between 40 and 60%",
"v60-80": "visibility of whole object is between 60 and 80%",
"v80-100": "visibility of whole object is between 80 and 100%",
"none": "visibility isn't available",
},
),
default_value="",
)

if osp.exists(osp.join(anno_dir, SampleAnnotationTable.FILENAME)):
self._sample_annotation_table = SampleAnnotationTable.from_json(
osp.join(anno_dir, SampleAnnotationTable.FILENAME)
)

if osp.exists(osp.join(anno_dir, ObjectAnnTable.FILENAME)):
self._object_ann_table = ObjectAnnTable.from_json(
osp.join(anno_dir, ObjectAnnTable.FILENAME)
)

if osp.exists(osp.join(anno_dir, SurfaceAnnTable.FILENAME)):
self._surface_ann_table = SurfaceAnnTable.from_json(
osp.join(anno_dir, SurfaceAnnTable.FILENAME)
)
25 changes: 5 additions & 20 deletions perception_dataset/t4_dataset/classes/abstract_class.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,9 +24,6 @@ def token(self, token: str):
def to_dict(self) -> Dict[str, Any]:
raise NotImplementedError()

def __eq__(self, value: T) -> bool:
return self.__dict__ == value.__dict__


T = TypeVar("T", bound=AbstractRecord)

Expand All @@ -46,10 +43,6 @@ def _to_record(self, **kwargs) -> T:
raise NotImplementedError()

def set_record_to_table(self, record: T):
same_tokens = [token for token, v in self._token_to_record.items() if v == record]
assert len(same_tokens) in (0, 1)
if len(same_tokens) == 1:
record.token = same_tokens[0] # overwrite record token with the existing one
self._token_to_record[record.token] = record

def insert_into_table(self, **kwargs) -> str:
Expand All @@ -60,19 +53,6 @@ def insert_into_table(self, **kwargs) -> str:
self.set_record_to_table(record)
return record.token

def insert_from_json(self, filepath: str):
with open(filepath, "r") as f:
table_data: List[Dict[str, Any]] = json.load(f)

for data in table_data:
token: str = data.pop("token")
record = self._to_record(**data)
record.token = token
assert isinstance(
record, AbstractRecord
), "_to_record function must return the instance of RecordClass"
self.set_record_to_table(record)

def select_record_from_token(self, token: str) -> T:
assert (
token in self._token_to_record
Expand All @@ -97,3 +77,8 @@ def save_json(self, output_dir: str):
table_data = self.to_data()
with open(osp.join(output_dir, self.FILENAME), "w") as f:
json.dump(table_data, f, indent=4)

@classmethod
@abstractmethod
def from_json(cls, filepath: str):
raise NotImplementedError
22 changes: 22 additions & 0 deletions perception_dataset/t4_dataset/classes/attribute.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
from __future__ import annotations

import json
from typing import Dict

from perception_dataset.constants import EXTENSION_ENUM
Expand Down Expand Up @@ -46,3 +49,22 @@ def get_token_from_name(self, name: str) -> str:
self._name_to_token[name] = token

return token

@classmethod
def from_json(
cls,
filepath: str,
name_to_description: Dict[str, str],
default_value: str,
) -> AttributeTable:
with open(filepath) as f:
items = json.load(f)

table = cls(name_to_description=name_to_description, default_value=default_value)

for item in items:
record = AttributeRecord(name=item["name"], description=item["description"])
record.token = item["token"]
table.set_record_to_table(record)

return table
31 changes: 31 additions & 0 deletions perception_dataset/t4_dataset/classes/calibrated_sensor.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
from __future__ import annotations

import json
from typing import Any, Dict, List

import numpy as np
Expand Down Expand Up @@ -58,3 +61,31 @@ def __init__(self):

def _to_record(self, **kwargs) -> CalibratedSensorRecord:
return CalibratedSensorRecord(**kwargs)

@classmethod
def from_json(cls, filepath: str) -> CalibratedSensorTable:
with open(filepath) as f:
items = json.load(f)

table = cls()
for item in items:
record = CalibratedSensorRecord(
sensor_token=item["sensor_token"],
translation={
"x": item["translation"][0],
"y": item["translation"][1],
"z": item["translation"][2],
},
rotation={
"w": item["rotation"][0],
"x": item["rotation"][1],
"y": item["rotation"][2],
"z": item["rotation"][3],
},
camera_intrinsic=item["camera_intrinsic"],
camera_distortion=item["camera_distortion"],
)
record.token = item["token"]
table.set_record_to_table(record)

return table
21 changes: 21 additions & 0 deletions perception_dataset/t4_dataset/classes/category.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
from __future__ import annotations

import json
from typing import Dict

from perception_dataset.constants import EXTENSION_ENUM
Expand Down Expand Up @@ -46,3 +49,21 @@ def get_token_from_name(self, name: str) -> str:
self._name_to_token[name] = token

return token

@classmethod
def from_json(
cls,
filepath: str,
name_to_description: Dict[str, str],
default_value: str,
) -> CategoryTable:
with open(filepath) as f:
items = json.load(f)

table = cls(name_to_description=name_to_description, default_value=default_value)
for item in items:
record = CategoryRecord(name=item["name"], description=item["description"])
record.token = item["token"]
table.set_record_to_table(record)

return table
Loading

0 comments on commit d96f426

Please sign in to comment.