[Datumaro] Add dataset examples (#1640)

* add dataset examples
main
zhiltsov-max 6 years ago committed by GitHub
parent da3fa34ce0
commit d1b2960b3d
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@ -32,15 +32,26 @@ VOC-like dataset -- ---> Publication etc.
- Dataset format conversions:
- COCO (`image_info`, `instances`, `person_keypoints`, `captions`, `labels`*)
- [Format specification](http://cocodataset.org/#format-data)
- [Dataset example](tests/assets/coco_dataset)
- `labels` are our extension - like `instances` with only `category_id`
- PASCAL VOC (`classification`, `detection`, `segmentation` (class, instances), `action_classification`, `person_layout`)
- [Format specification](http://host.robots.ox.ac.uk/pascal/VOC/voc2012/htmldoc/index.html)
- [Dataset example](tests/assets/voc_dataset)
- YOLO (`bboxes`)
- [Format specification](https://github.com/AlexeyAB/darknet#how-to-train-pascal-voc-data)
- [Dataset example](tests/assets/yolo_dataset)
- TF Detection API (`bboxes`, `masks`)
- Format specifications: [bboxes](https://github.com/tensorflow/models/blob/master/research/object_detection/g3doc/using_your_own_dataset.md), [masks](https://github.com/tensorflow/models/blob/master/research/object_detection/g3doc/instance_segmentation.md)
- [Dataset example](tests/assets/tf_detection_api_dataset)
- MOT sequences
- [Format specification](https://arxiv.org/pdf/1906.04567.pdf)
- [Dataset example](tests/assets/mot_dataset)
- CVAT
- [Format specification](https://github.com/opencv/cvat/blob/develop/cvat/apps/documentation/xml_format.md)
- [Dataset example](tests/assets/cvat_dataset)
- LabelMe
- [Format specification](http://labelme.csail.mit.edu/Release3.0)
- [Dataset example](tests/assets/labelme_dataset)
- Dataset building operations:
- Merging multiple datasets into one
- Dataset filtering with custom conditions, for instance:
@ -52,7 +63,7 @@ VOC-like dataset -- ---> Publication etc.
- Annotation conversions, for instance
- polygons to instance masks and vice versa
- apply a custom colormap for mask annotations
- remap dataset labels
- rename or remove dataset labels
- Dataset comparison
- Model integration:
- Inference (OpenVINO and custom models)

@ -0,0 +1,59 @@
{
"licenses": [
{
"name": "",
"id": 0,
"url": ""
}
],
"info": {
"contributor": "",
"date_created": "",
"description": "",
"url": "",
"version": "",
"year": ""
},
"categories": [
{
"id": 1,
"name": "TEST",
"supercategory": ""
}
],
"images": [
{
"id": 1,
"width": 5,
"height": 10,
"file_name": "000000000001.jpg",
"license": 0,
"flickr_url": "",
"coco_url": "",
"date_captured": 0
}
],
"annotations": [
{
"id": 1,
"image_id": 1,
"category_id": 1,
"segmentation": [[0, 0, 1, 0, 1, 2, 0, 2]],
"area": 2,
"bbox": [0, 0, 1, 2],
"iscrowd": 0
},
{
"id": 2,
"image_id": 1,
"category_id": 1,
"segmentation": {
"counts": [0, 10, 5, 5, 5, 5, 0, 10, 10, 0],
"size": [10, 5]
},
"area": 30,
"bbox": [0, 0, 10, 4],
"iscrowd": 1
}
]
}

Binary file not shown.

After

Width:  |  Height:  |  Size: 631 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 631 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 631 B

@ -0,0 +1,45 @@
<!-- Example CVAT XML annotation file: format version 1.1, task mode "annotation",
     with shapes grouped under per-image <image> elements. -->
<annotations>
<version>1.1</version>
<meta>
<task>
<z_order>True</z_order>
<mode>annotation</mode>
<!-- Label schema: label1 declares two attributes (a1, a2); label2 declares none. -->
<labels>
<label>
<name>label1</name>
<attributes>
<attribute>
<name>a1</name>
<input_type>checkbox</input_type>
<default_value>false</default_value>
<!-- The <values> text spans several lines, one value per line. -->
<values>false
true</values>
</attribute>
<attribute>
<name>a2</name>
<input_type>radio</input_type>
<default_value>v1</default_value>
<values>v1
v2
v3</values>
</attribute>
</attributes>
</label>
<label>
<name>label2</name>
</label>
</labels>
</task>
</meta>
<!-- Image 0 (8x8): a box on label1 with both attributes set, plus a polyline whose label is empty. -->
<image height="8" id="0" name="img0.jpg" width="8">
<box label="label1" occluded="1" xbr="4" xtl="0" ybr="4" ytl="2" z_order="1">
<attribute name="a1">true</attribute>
<attribute name="a2">v3</attribute>
</box>
<polyline label="" points="1.0,2;3,4;5,6;7,8"/>
</image>
<!-- Image 1 (10x10): a polygon whose label is empty and a points shape on label2. -->
<image height="10" id="1" name="img1.jpg" width="10">
<polygon label="" points="1,2;3,4;6,5" z_order="1"/>
<points label="label2" points="1,2;3,4;5,6" z_order="2"/>
</image>
</annotations>

@ -0,0 +1,92 @@
<?xml version="1.0" encoding="utf-8"?>
<!-- Example CVAT XML dump of a task in "interpolation" mode (source: t.mp4).
     Shapes are grouped into <track> elements, each holding one child shape per frame. -->
<annotations>
<version>1.1</version>
<meta>
<task>
<id>5</id>
<name>v1</name>
<size>4</size>
<mode>interpolation</mode>
<overlap>2</overlap>
<bugtracker></bugtracker>
<created>2020-04-23 08:57:24.614217+00:00</created>
<updated>2020-04-23 09:04:48.168008+00:00</updated>
<!-- The frame numbers used by the tracks below (10, 13, 16) line up with
     start_frame=10 and the step=3 frame filter. -->
<start_frame>10</start_frame>
<stop_frame>19</stop_frame>
<frame_filter>step=3</frame_filter>
<z_order>True</z_order>
<!-- Label schema: "klhg" has one select attribute (hgl); "z U k" and "II" have empty attribute lists. -->
<labels>
<label>
<name>klhg</name>
<attributes>
<attribute>
<name>hgl</name>
<mutable>True</mutable>
<input_type>select</input_type>
<default_value>jk</default_value>
<values>jk
hgkf</values>
</attribute>
</attributes>
</label>
<label>
<name>z U k</name>
<attributes>
</attributes>
</label>
<label>
<name>II</name>
<attributes>
</attributes>
</label>
</labels>
<segments>
<segment>
<id>3</id>
<start>0</start>
<stop>3</stop>
<url>http://localhost:7000/?id=3</url>
</segment>
<segment>
<id>4</id>
<start>2</start>
<stop>3</stop>
<url>http://localhost:7000/?id=4</url>
</segment>
</segments>
<owner>
<username>max</username>
<email></email>
</owner>
<assignee></assignee>
<original_size>
<width>25</width>
<height>20</height>
</original_size>
</task>
<dumped>2020-04-23 09:05:02.335612+00:00</dumped>
<source>t.mp4</source>
</meta>
<!-- Track 0 (label "II"): boxes at frames 10, 13 and 16; the last two are marked outside="1". -->
<track id="0" label="II">
<box frame="10" outside="0" occluded="1" keyframe="1" xtl="3.00" ytl="4.00" xbr="10.00" ybr="5.00" z_order="0">
</box>
<box frame="13" outside="1" occluded="0" keyframe="1" xtl="7.00" ytl="6.00" xbr="14.00" ybr="8.00" z_order="0">
</box>
<box frame="16" outside="1" occluded="0" keyframe="1" xtl="8.00" ytl="7.00" xbr="14.0" ybr="17.00" z_order="0">
</box>
</track>
<!-- Track 1 (label "klhg"): points shapes at frames 10 and 13, each carrying its own "hgl" attribute value. -->
<track id="1" label="klhg">
<points frame="10" outside="0" occluded="0" keyframe="1" points="21.95,8.00;2.55,15.09;2.23,3.16" z_order="0">
<attribute name="hgl">hgkf</attribute>
</points>
<points frame="13" outside="1" occluded="0" keyframe="1" points="21.95,8.00;9.55,15.09;5.23,1.16" z_order="0">
<attribute name="hgl">jk</attribute>
</points>
</track>
<!-- Track 2 (label "II"): polylines at frames 13 and 16 with identical points; the second is marked outside="1". -->
<track id="2" label="II">
<polyline frame="13" outside="0" occluded="0" keyframe="1" points="7.85,13.88;3.50,6.67;15.90,2.00;13.31,7.21" z_order="0">
</polyline>
<polyline frame="16" outside="1" occluded="0" keyframe="1" points="7.85,13.88;3.50,6.67;15.90,2.00;13.31,7.21" z_order="0">
</polyline>
</track>
</annotations>

Binary file not shown.

After

Width:  |  Height:  |  Size: 111 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 111 B

@ -0,0 +1,10 @@
label_0
label_1
label_2
label_3
label_4
label_5
label_6
label_7
label_8
label_9

Binary file not shown.

After

Width:  |  Height:  |  Size: 631 B

@ -0,0 +1,50 @@
item {
id: 1
name: 'label_0'
}
item {
id: 2
name: 'label_1'
}
item {
id: 3
name: 'label_2'
}
item {
id: 4
name: 'label_3'
}
item {
id: 5
name: 'label_4'
}
item {
id: 6
name: 'label_5'
}
item {
id: 7
name: 'label_6'
}
item {
id: 8
name: 'label_7'
}
item {
id: 9
name: 'label_8'
}
item {
id: 10
name: 'label_9'
}

@ -0,0 +1,54 @@
<?xml version="1.0" encoding="UTF-8"?>
<!-- Example PASCAL VOC-style annotation for image 2007_000001.jpg (10x20, depth 3)
     describing two objects: a cat and a person. -->
<annotation>
<folder>VOC2007</folder>
<filename>2007_000001.jpg</filename>
<size>
<width>10</width>
<height>20</height>
<depth>3</depth>
</size>
<segmented>1</segmented>
<!-- First object: bounding box plus pose / truncated / difficult fields. -->
<object>
<name>cat</name>
<pose>Unspecified</pose>
<truncated>1</truncated>
<difficult>0</difficult>
<bndbox>
<xmin>1</xmin>
<ymin>2</ymin>
<xmax>3</xmax>
<ymax>4</ymax>
</bndbox>
</object>
<!-- Second object: bounding box only (no pose / truncated / difficult),
     plus a body part with its own box and a set of per-action 0/1 flags. -->
<object>
<name>person</name>
<bndbox>
<xmin>4</xmin>
<ymin>5</ymin>
<xmax>6</xmax>
<ymax>7</ymax>
</bndbox>
<!-- The part box uses fractional coordinates (5.5, 7.5), unlike the object boxes. -->
<part>
<name>head</name>
<bndbox>
<xmin>5.5</xmin>
<ymin>6</ymin>
<xmax>7.5</xmax>
<ymax>8</ymax>
</bndbox>
</part>
<actions>
<other>1</other>
<jumping>0</jumping>
<phoning>1</phoning>
<playinginstrument>0</playinginstrument>
<reading>1</reading>
<ridingbike>0</ridingbike>
<ridinghorse>1</ridinghorse>
<running>0</running>
<takingphoto>1</takingphoto>
<usingcomputer>0</usingcomputer>
<walking>1</walking>
</actions>
</object>
</annotation>

Binary file not shown.

After

Width:  |  Height:  |  Size: 635 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 87 B

Binary file not shown.

After

Width:  |  Height:  |  Size: 82 B

@ -0,0 +1,4 @@
classes = 10
train = data/train.txt
names = data/obj.names
backup = backup/

@ -0,0 +1,10 @@
label_0
label_1
label_2
label_3
label_4
label_5
label_6
label_7
label_8
label_9

Binary file not shown.

After

Width:  |  Height:  |  Size: 631 B

@ -0,0 +1,2 @@
2 0.133333 0.300000 0.266667 0.200000
4 0.266667 0.450000 0.133333 0.300000
Loading…
Cancel
Save