|
6 | 6 | import os.path as osp
|
7 | 7 | import random
|
8 | 8 | from unittest import TestCase
|
| 9 | +from unittest.mock import MagicMock, patch |
9 | 10 |
|
10 | 11 | import numpy as np
|
11 | 12 | import pandas as pd
|
|
33 | 34 | Tabular,
|
34 | 35 | TabularCategories,
|
35 | 36 | )
|
36 |
| -from datumaro.components.dataset import Dataset |
| 37 | +from datumaro.components.dataset import Dataset, eager_mode |
37 | 38 | from datumaro.components.dataset_base import DatasetItem
|
38 | 39 | from datumaro.components.errors import AnnotationTypeError
|
39 |
| -from datumaro.components.media import Image, Table, TableRow |
| 40 | +from datumaro.components.media import Image, Table, TableRow, Video, VideoFrame |
40 | 41 |
|
41 | 42 | from ..requirements import Requirements, mark_bug, mark_requirement
|
42 | 43 |
|
@@ -420,26 +421,6 @@ def test_shapes_to_boxes(self):
|
420 | 421 | actual = transforms.ShapesToBoxes(source_dataset)
|
421 | 422 | compare_datasets(self, target_dataset, actual)
|
422 | 423 |
|
423 |
| - @mark_requirement(Requirements.DATUM_GENERAL_REQ) |
424 |
| - def test_id_from_image(self): |
425 |
| - source_dataset = Dataset.from_iterable( |
426 |
| - [ |
427 |
| - DatasetItem(id=1, media=Image.from_file(path="path.jpg")), |
428 |
| - DatasetItem(id=2), |
429 |
| - DatasetItem(id=3, media=Image.from_numpy(data=np.ones([5, 5, 3]))), |
430 |
| - ] |
431 |
| - ) |
432 |
| - target_dataset = Dataset.from_iterable( |
433 |
| - [ |
434 |
| - DatasetItem(id="path", media=Image.from_file(path="path.jpg")), |
435 |
| - DatasetItem(id=2), |
436 |
| - DatasetItem(id=3, media=Image.from_numpy(data=np.ones([5, 5, 3]))), |
437 |
| - ] |
438 |
| - ) |
439 |
| - |
440 |
| - actual = transforms.IdFromImageName(source_dataset) |
441 |
| - compare_datasets(self, target_dataset, actual) |
442 |
| - |
443 | 424 | @mark_requirement(Requirements.DATUM_GENERAL_REQ)
|
444 | 425 | def test_boxes_to_masks(self):
|
445 | 426 | source_dataset = Dataset.from_iterable(
|
@@ -1227,6 +1208,84 @@ def test_annotation_reindex(self, fxt_dataset: Dataset, reindex_each_item: bool)
|
1227 | 1208 | )
|
1228 | 1209 |
|
1229 | 1210 |
|
| 1211 | +class IdFromImageNameTest: |
| 1212 | + @pytest.fixture |
| 1213 | + def fxt_dataset(self, n_labels=3, n_anns=5, n_items=7) -> Dataset: |
| 1214 | + video = Video("video.mp4") |
| 1215 | + video._frame_size = MagicMock(return_value=(32, 32)) |
| 1216 | + video.get_frame_data = MagicMock(return_value=np.ndarray((32, 32, 3), dtype=np.uint8)) |
| 1217 | + return Dataset.from_iterable( |
| 1218 | + [ |
| 1219 | + DatasetItem(id=1, media=Image.from_file(path="path1.jpg")), |
| 1220 | + DatasetItem(id=2, media=Image.from_file(path="path1.jpg")), |
| 1221 | + DatasetItem(id=3, media=Image.from_file(path="path1.jpg")), |
| 1222 | + DatasetItem(id=4, media=VideoFrame(video, index=30)), |
| 1223 | + DatasetItem(id=5, media=VideoFrame(video, index=30)), |
| 1224 | + DatasetItem(id=6, media=VideoFrame(video, index=60)), |
| 1225 | + DatasetItem(id=7), |
| 1226 | + DatasetItem(id=8, media=Image.from_numpy(data=np.ones([5, 5, 3]))), |
| 1227 | + ] |
| 1228 | + ) |
| 1229 | + |
| 1230 | + @mark_requirement(Requirements.DATUM_GENERAL_REQ) |
| 1231 | + @pytest.mark.parametrize("ensure_unique", [True, False]) |
| 1232 | + def test_id_from_image(self, fxt_dataset, ensure_unique): |
| 1233 | + source_dataset: Dataset = fxt_dataset |
| 1234 | + actual_dataset = transforms.IdFromImageName(source_dataset, ensure_unique=ensure_unique) |
| 1235 | + |
| 1236 | + unique_names: set[str] = set() |
| 1237 | + for src, actual in zip(source_dataset, actual_dataset): |
| 1238 | + if not isinstance(src.media, Image) or not hasattr(src.media, "path"): |
| 1239 | + src == actual |
| 1240 | + else: |
| 1241 | + if isinstance(src.media, VideoFrame): |
| 1242 | + expected_id = f"video_frame-{src.media.index}" |
| 1243 | + else: |
| 1244 | + expected_id = os.path.splitext(src.media.path)[0] |
| 1245 | + if ensure_unique: |
| 1246 | + assert actual.id.startswith(expected_id) |
| 1247 | + assert actual.wrap(id=src.id) == src |
| 1248 | + assert actual.id not in unique_names |
| 1249 | + unique_names.add(actual.id) |
| 1250 | + else: |
| 1251 | + assert src.wrap(id=expected_id) == actual |
| 1252 | + |
| 1253 | + @mark_requirement(Requirements.DATUM_GENERAL_REQ) |
| 1254 | + def test_id_from_image_wrong_suffix_length(self, fxt_dataset): |
| 1255 | + with pytest.raises(ValueError) as e: |
| 1256 | + transforms.IdFromImageName(fxt_dataset, ensure_unique=True, suffix_length=0) |
| 1257 | + assert str(e.value).startswith("The 'suffix_length' must be greater than 0.") |
| 1258 | + |
| 1259 | + @mark_requirement(Requirements.DATUM_GENERAL_REQ) |
| 1260 | + def test_id_from_image_too_many_duplication(self, fxt_dataset): |
| 1261 | + with patch("datumaro.plugins.transforms.IdFromImageName.DEFAULT_RETRY", 1), patch( |
| 1262 | + "datumaro.plugins.transforms.IdFromImageName.SUFFIX_LETTERS", "a" |
| 1263 | + ), pytest.raises(Exception) as e: |
| 1264 | + with eager_mode(): |
| 1265 | + fxt_dataset.transform( |
| 1266 | + "id_from_image_name", |
| 1267 | + ensure_unique=True, |
| 1268 | + suffix_length=1, |
| 1269 | + ) |
| 1270 | + assert str(e.value).startswith("Too many duplicate names.") |
| 1271 | + |
| 1272 | + @mark_requirement(Requirements.DATUM_GENERAL_REQ) |
| 1273 | + @pytest.mark.parametrize( |
| 1274 | + "args,ensure_unique,suffix_length", |
| 1275 | + [ |
| 1276 | + ([], False, 3), |
| 1277 | + (["--ensure_unique", "--suffix_length", "2"], True, 2), |
| 1278 | + ], |
| 1279 | + ids=["default", "ensure_unique"], |
| 1280 | + ) |
| 1281 | + def test_parser(self, args, ensure_unique, suffix_length): |
| 1282 | + parser = transforms.IdFromImageName.build_cmdline_parser() |
| 1283 | + args = parser.parse_args(args) |
| 1284 | + |
| 1285 | + assert hasattr(args, "ensure_unique") and args.ensure_unique == ensure_unique |
| 1286 | + assert hasattr(args, "suffix_length") and args.suffix_length == suffix_length |
| 1287 | + |
| 1288 | + |
1230 | 1289 | class AstypeAnnotationsTest(TestCase):
|
1231 | 1290 | def setUp(self):
|
1232 | 1291 | self.table = Table.from_list(
|
|
0 commit comments