Manifest optimization (#3712)

5 years ago · 5b890b1785
parent cf6878e19c
commit 5b890b1785
7 changed files with 324 additions and 254 deletions
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -12,10 +12,12 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - cvat-ui: support cloud storages (<https://github.com/openvinotoolkit/cvat/pull/3372>)
 - interactor: add HRNet interactive segmentation serverless function (<https://github.com/openvinotoolkit/cvat/pull/3740>)
 - Added GPU implementation for SiamMask, reworked tracking approach (<https://github.com/openvinotoolkit/cvat/pull/3571>)
+- Progress bar for manifest creating (<https://github.com/openvinotoolkit/cvat/pull/3712>)

 ### Changed

 - UI tracking has been reworked (<https://github.com/openvinotoolkit/cvat/pull/3571>)
+- Manifest generation: Reduce creating time (<https://github.com/openvinotoolkit/cvat/pull/3712>)

 ### Deprecated

--- a/cvat/apps/engine/migrations/0038_manifest.py
+++ b/cvat/apps/engine/migrations/0038_manifest.py
@ -43,10 +43,11 @@ def migrate2meta(apps, shema_editor):
                    continue
                media_file = os.path.join(data_dir, db_data.video.path)
                logger.info('Preparing of the video meta has begun')
-                meta = VideoManifestManager(manifest_path=upload_dir) \
-                    .prepare_meta(media_file=media_file, force=True)
+                manifest = VideoManifestManager(manifest_path=upload_dir)
+                manifest.link(media_file=media_file, force=True)
+                manifest.init_index()
                with open(meta_path, "w") as meta_file:
-                    for idx, pts, _ in meta:
+                    for idx, pts, _ in manifest.reader:
                        meta_file.write(f"{idx} {pts}\n")
            else:
                name_format = "dummy_{}.txt"
@ -87,12 +88,9 @@ def migrate2manifest(apps, shema_editor):
            if hasattr(db_data, 'video'):
                media_file = os.path.join(data_dir, db_data.video.path)
                manifest = VideoManifestManager(manifest_path=upload_dir)
-                logger.info('Preparing of the video meta information has begun')
-                meta_info = manifest.prepare_meta(media_file=media_file, force=True)
+                manifest.link(media_file=media_file, force=True)
                logger.info('Manifest creating has begun')
-                manifest.create(meta_info)
-                logger.info('Index creating has begun')
-                manifest.init_index()
+                manifest.create()
            else:
                manifest = ImageManifestManager(manifest_path=upload_dir)
                sources = []
@ -105,36 +103,21 @@ def migrate2manifest(apps, shema_editor):
                    sources = [os.path.join(data_dir, db_image.path) for db_image in db_data.images.all().order_by('frame')]
                if any(list(filter(lambda x: x.dimension==DimensionType.DIM_3D, db_data.tasks.all()))):
                    logger.info('Preparing of images 3d meta information has begun')
-                    content = []
-                    for source in sources:
-                        name, ext = os.path.splitext(os.path.relpath(source, upload_dir))
-                        content.append({
-                            'name': name,
-                            'extension': ext
-                        })
+                    manifest.link(sources=sources, data_dir=data_dir, DIM_3D=True)
                else:
                    logger.info('Preparing of 2d images meta information has begun')
-                    meta_info = manifest.prepare_meta(sources=sources, data_dir=data_dir)
-                    content = meta_info.content
+                    manifest.link(sources=sources, data_dir=data_dir)

                if db_data.storage == StorageChoice.SHARE:
                    def _get_frame_step(str_):
                        match = search("step\s*=\s*([1-9]\d*)", str_)
                        return int(match.group(1)) if match else 1
                    logger.info('Data is located on the share, metadata update has been started')
-                    step = _get_frame_step(db_data.frame_filter)
-                    start = db_data.start_frame
-                    stop = db_data.stop_frame + 1
-                    images_range = range(start, stop, step)
-                    result_content = []
-                    for i in range(stop):
-                        item = content.pop(0) if i in images_range else dict()
-                        result_content.append(item)
-                    content = result_content
+                    manifest.step = _get_frame_step(db_data.frame_filter)
+                    manifest.start = db_data.start_frame
+                    manifest.stop = db_data.stop_frame + 1
                logger.info('Manifest creating has begun')
-                manifest.create(content)
-                logger.info('Index creating has begun')
-                manifest.init_index()
+                manifest.create()
            logger.info('Succesfull migration for the data({})'.format(db_data.id))
        except Exception as ex:
            logger.error(str(ex))
--- a/cvat/apps/engine/task.py
+++ b/cvat/apps/engine/task.py
@ -265,7 +265,6 @@ def _create_thread(tid, data, isImport=False):
            media_files = sorted(media['image'])
            content = cloud_storage_manifest.get_subset(media_files)
            manifest.create(content)
-            manifest.init_index()

    av_scan_paths(upload_dir)

@ -424,8 +423,7 @@ def _create_thread(tid, data, isImport=False):
                            video_size = manifest.video_resolution
                            manifest_is_prepared = True
                        except Exception as ex:
-                            if os.path.exists(db_data.get_index_path()):
-                                os.remove(db_data.get_index_path())
+                            manifest.remove()
                            if isinstance(ex, AssertionError):
                                base_msg = str(ex)
                            else:
@ -436,17 +434,16 @@ def _create_thread(tid, data, isImport=False):
                    if not manifest_is_prepared:
                        _update_status('Start prepare a manifest file')
                        manifest = VideoManifestManager(db_data.get_manifest_path())
-                        meta_info = manifest.prepare_meta(
+                        manifest.link(
                            media_file=media_files[0],
                            upload_dir=upload_dir,
                            chunk_size=db_data.chunk_size
                        )
-                        manifest.create(meta_info)
-                        manifest.init_index()
+                        manifest.create()
                        _update_status('A manifest had been created')

-                        all_frames = meta_info.get_size()
-                        video_size = meta_info.frame_sizes
+                        all_frames = len(manifest.reader)
+                        video_size = manifest.reader.resolution
                        manifest_is_prepared = True

                    db_data.size = len(range(db_data.start_frame, min(data['stop_frame'] + 1 \
@ -454,10 +451,8 @@ def _create_thread(tid, data, isImport=False):
                    video_path = os.path.join(upload_dir, media_files[0])
                except Exception as ex:
                    db_data.storage_method = models.StorageMethodChoice.FILE_SYSTEM
-                    if os.path.exists(db_data.get_manifest_path()):
-                        os.remove(db_data.get_manifest_path())
-                    if os.path.exists(db_data.get_index_path()):
-                        os.remove(db_data.get_index_path())
+                    manifest.remove()
+                    del manifest
                    base_msg = str(ex) if isinstance(ex, AssertionError) \
                        else "Uploaded video does not support a quick way of task creating."
                    _update_status("{} The task will be created using the old method".format(base_msg))
@ -465,24 +460,15 @@ def _create_thread(tid, data, isImport=False):
                db_data.size = len(extractor)
                manifest = ImageManifestManager(db_data.get_manifest_path())
                if not manifest_file:
-                    if db_task.dimension == models.DimensionType.DIM_2D:
-                        meta_info = manifest.prepare_meta(
-                            sources=extractor.absolute_source_paths,
-                            meta={ k: {'related_images': related_images[k] } for k in related_images },
-                            data_dir=upload_dir
-                        )
-                        content = meta_info.content
-                    else:
-                        content = []
-                        for source in extractor.absolute_source_paths:
-                            name, ext = os.path.splitext(os.path.relpath(source, upload_dir))
-                            content.append({
-                                'name': name,
-                                'meta': { 'related_images': related_images[''.join((name, ext))] },
-                                'extension': ext
-                            })
-                    manifest.create(content)
-                manifest.init_index()
+                    manifest.link(
+                        sources=extractor.absolute_source_paths,
+                        meta={ k: {'related_images': related_images[k] } for k in related_images },
+                        data_dir=upload_dir,
+                        DIM_3D=(db_task.dimension == models.DimensionType.DIM_3D),
+                    )
+                    manifest.create()
+                else:
+                    manifest.init_index()
                counter = itertools.count()
                for _, chunk_frames in itertools.groupby(extractor.frame_range, lambda x: next(counter) // db_data.chunk_size):
                    chunk_paths = [(extractor.get_path(i), i) for i in chunk_frames]
--- a/cvat/apps/engine/tests/test_rest_api.py
+++ b/cvat/apps/engine/tests/test_rest_api.py
@ -2512,11 +2512,11 @@ def generate_manifest_file(data_type, manifest_path, sources):
    }

    if data_type == 'video':
-        manifest = VideoManifestManager(manifest_path)
+        manifest = VideoManifestManager(manifest_path, create_index=False)
    else:
-        manifest = ImageManifestManager(manifest_path)
-    prepared_meta = manifest.prepare_meta(**kwargs[data_type])
-    manifest.create(prepared_meta)
+        manifest = ImageManifestManager(manifest_path, create_index=False)
+    manifest.link(**kwargs[data_type])
+    manifest.create()

 class TaskDataAPITestCase(APITestCase):
    _image_sizes = {}
--- a/utils/dataset_manifest/core.py
+++ b/utils/dataset_manifest/core.py
@ -6,19 +6,49 @@ import av
 import json
 import os
 from abc import ABC, abstractmethod, abstractproperty
-from collections import OrderedDict
 from contextlib import closing
+from tempfile import NamedTemporaryFile
+
 from PIL import Image
 from .utils import md5_hash, rotate_image

 class VideoStreamReader:
-    def __init__(self, source_path):
-        self.source_path = source_path
-        self._key_frames = OrderedDict()
-        self.frames = 0
+    def __init__(self, source_path, chunk_size, force):
+        self._source_path = source_path
+        self._frames_number = None
+        self._force = force
+        self._upper_bound = 3 * chunk_size + 1

        with closing(av.open(self.source_path, mode='r')) as container:
-            self.width, self.height = self._get_frame_size(container)
+            video_stream = VideoStreamReader._get_video_stream(container)
+            isBreaked = False
+            for packet in container.demux(video_stream):
+                if isBreaked:
+                    break
+                for frame in packet.decode():
+                    # check type of first frame
+                    if not frame.pict_type.name == 'I':
+                        raise Exception('First frame is not key frame')
+
+                    # get video resolution
+                    if video_stream.metadata.get('rotate'):
+                        frame = av.VideoFrame().from_ndarray(
+                            rotate_image(
+                                frame.to_ndarray(format='bgr24'),
+                                360 - int(container.streams.video[0].metadata.get('rotate')),
+                            ),
+                            format ='bgr24',
+                        )
+                    self.height, self.width = (frame.height, frame.width)
+                    # not all videos contain information about numbers of frames
+                    if video_stream.frames:
+                        self._frames_number = video_stream.frames
+                    isBreaked = True
+                    break
+
+    @property
+    def source_path(self):
+        return self._source_path

    @staticmethod
    def _get_video_stream(container):
@ -26,157 +56,186 @@ class VideoStreamReader:
        video_stream.thread_type = 'AUTO'
        return video_stream

-    @staticmethod
-    def _get_frame_size(container):
-        video_stream = VideoStreamReader._get_video_stream(container)
+    def __len__(self):
+        return self._frames_number
+
+    @property
+    def resolution(self):
+        return (self.width, self.height)
+
+    def validate_key_frame(self, container, video_stream, key_frame):
        for packet in container.demux(video_stream):
            for frame in packet.decode():
-                if video_stream.metadata.get('rotate'):
-                    frame = av.VideoFrame().from_ndarray(
-                        rotate_image(
-                            frame.to_ndarray(format='bgr24'),
-                            360 - int(container.streams.video[0].metadata.get('rotate')),
-                        ),
-                        format ='bgr24',
-                    )
-                return frame.width, frame.height
-
-    def check_type_first_frame(self):
-        with closing(av.open(self.source_path, mode='r')) as container:
-            video_stream = self._get_video_stream(container)
+                if md5_hash(frame) != key_frame['md5'] or frame.pts != key_frame['pts']:
+                    return False
+                return True

-            for packet in container.demux(video_stream):
-                for frame in packet.decode():
-                    if not frame.pict_type.name == 'I':
-                        raise Exception('First frame is not key frame')
-                    return
-
-    def check_video_timestamps_sequences(self):
+    def __iter__(self):
        with closing(av.open(self.source_path, mode='r')) as container:
            video_stream = self._get_video_stream(container)
-
-            frame_pts = -1
-            frame_dts = -1
+            frame_pts, frame_dts = -1, -1
+            index, key_frame_number = 0, 0
            for packet in container.demux(video_stream):
                for frame in packet.decode():
-
                    if None not in {frame.pts, frame_pts} and frame.pts <= frame_pts:
                        raise Exception('Invalid pts sequences')
-
                    if None not in {frame.dts, frame_dts} and frame.dts <= frame_dts:
                        raise Exception('Invalid dts sequences')
-
                    frame_pts, frame_dts = frame.pts, frame.dts

-    def rough_estimate_frames_ratio(self, upper_bound):
-        analyzed_frames_number, key_frames_number = 0, 0
-        _processing_end = False
-
-        with closing(av.open(self.source_path, mode='r')) as container:
-            video_stream = self._get_video_stream(container)
-            for packet in container.demux(video_stream):
-                for frame in packet.decode():
                    if frame.key_frame:
-                        key_frames_number += 1
-                    analyzed_frames_number += 1
-                    if upper_bound == analyzed_frames_number:
-                        _processing_end = True
-                        break
-                if _processing_end:
-                    break
-        # In our case no videos with non-key first frame, so 1 key frame is guaranteed
-        return analyzed_frames_number // key_frames_number
-
-    def validate_frames_ratio(self, chunk_size):
-        upper_bound = 3 * chunk_size
-        ratio = self.rough_estimate_frames_ratio(upper_bound + 1)
-        assert ratio < upper_bound, 'Too few keyframes'
+                        key_frame_number += 1
+                        ratio = (index + 1) // key_frame_number

-    def get_size(self):
-        return self.frames
-
-    @property
-    def frame_sizes(self):
-        return (self.width, self.height)
+                        if ratio >= self._upper_bound and not self._force:
+                            raise AssertionError('Too few keyframes')

-    def validate_key_frame(self, container, video_stream, key_frame):
-        for packet in container.demux(video_stream):
-            for frame in packet.decode():
-                if md5_hash(frame) != key_frame[1]['md5'] or frame.pts != key_frame[1]['pts']:
-                    self._key_frames.pop(key_frame[0])
-                return
-
-    def validate_seek_key_frames(self):
-        with closing(av.open(self.source_path, mode='r')) as container:
-            video_stream = self._get_video_stream(container)
-
-            key_frames_copy = self._key_frames.copy()
+                        key_frame = {
+                            'index': index,
+                            'pts': frame.pts,
+                            'md5': md5_hash(frame)
+                        }

-            for key_frame in key_frames_copy.items():
-                container.seek(offset=key_frame[1]['pts'], stream=video_stream)
-                self.validate_key_frame(container, video_stream, key_frame)
+                        with closing(av.open(self.source_path, mode='r')) as checked_container:
+                            checked_container.seek(offset=key_frame['pts'], stream=video_stream)
+                            isValid = self.validate_key_frame(checked_container, video_stream, key_frame)
+                            if isValid:
+                                yield (index, key_frame['pts'], key_frame['md5'])
+                    else:
+                        yield index
+                    index += 1
+            if not self._frames_number:
+                self._frames_number = index
+
+class KeyFramesVideoStreamReader(VideoStreamReader):
+    def __init__(self, **kwargs):
+        super().__init__(**kwargs)

-    def save_key_frames(self):
+    def __iter__(self):
        with closing(av.open(self.source_path, mode='r')) as container:
            video_stream = self._get_video_stream(container)
-            frame_number = 0
-
+            frame_pts, frame_dts = -1, -1
+            index, key_frame_number = 0, 0
            for packet in container.demux(video_stream):
                for frame in packet.decode():
+                    if None not in {frame.pts, frame_pts} and frame.pts <= frame_pts:
+                        raise Exception('Invalid pts sequences')
+                    if None not in {frame.dts, frame_dts} and frame.dts <= frame_dts:
+                        raise Exception('Invalid dts sequences')
+                    frame_pts, frame_dts = frame.pts, frame.dts
+
                    if frame.key_frame:
-                        self._key_frames[frame_number] = {
+                        key_frame_number += 1
+                        ratio = (index + 1) // key_frame_number
+                        if ratio >= self._upper_bound and not self._force:
+                            raise AssertionError('Too few keyframes')
+                        key_frame = {
+                            'index': index,
                            'pts': frame.pts,
-                            'md5': md5_hash(frame),
+                            'md5': md5_hash(frame)
                        }
-                    frame_number += 1
-            self.frames = frame_number
-
-    @property
-    def key_frames(self):
-        return self._key_frames
-
-    def __len__(self):
-        return len(self._key_frames)
-
-    #TODO: need to change it in future
-    def __iter__(self):
-        for idx, key_frame in self._key_frames.items():
-            yield (idx, key_frame['pts'], key_frame['md5'])

+                        with closing(av.open(self.source_path, mode='r')) as checked_container:
+                            checked_container.seek(offset=key_frame['pts'], stream=video_stream)
+                            isValid = self.validate_key_frame(checked_container, video_stream, key_frame)
+                            if isValid:
+                                yield (index, key_frame['pts'], key_frame['md5'])
+                    index += 1

 class DatasetImagesReader:
-    def __init__(self, sources, meta=None, is_sorted=True, use_image_hash=False, *args, **kwargs):
+    def __init__(self,
+                sources,
+                meta=None,
+                is_sorted=True,
+                use_image_hash=False,
+                start = 0,
+                step = 1,
+                stop = None,
+                *args,
+                **kwargs):
        self._sources = sources if is_sorted else sorted(sources)
        self._meta = meta
-        self._content = []
        self._data_dir = kwargs.get('data_dir', None)
        self._use_image_hash = use_image_hash
+        self._start = start
+        self._stop = stop if stop else len(sources)
+        self._step = step
+
+    @property
+    def start(self):
+        return self._start
+
+    @start.setter
+    def start(self, value):
+        self._start = int(value)
+
+    @property
+    def stop(self):
+        return self._stop
+
+    @stop.setter
+    def stop(self, value):
+        self._stop = int(value)
+
+    @property
+    def step(self):
+        return self._step
+
+    @step.setter
+    def step(self, value):
+        self._step = int(value)

    def __iter__(self):
-        for image in self._sources:
-            img = Image.open(image, mode='r')
-            img_name = os.path.relpath(image, self._data_dir) if self._data_dir \
-                else os.path.basename(image)
-            name, extension = os.path.splitext(img_name)
-            image_properties = {
-                'name': name.replace('\\', '/'),
-                'extension': extension,
-                'width': img.width,
-                'height': img.height,
-            }
-            if self._meta and img_name in self._meta:
-                image_properties['meta'] = self._meta[img_name]
-            if self._use_image_hash:
-                image_properties['checksum'] = md5_hash(img)
-            yield image_properties
-
-    def create(self):
-        for item in self:
-            self._content.append(item)
+        sources = (i for i in self._sources)
+        for idx in range(self._stop):
+            if idx in self.range_:
+                image = next(sources)
+                img = Image.open(image, mode='r')
+                img_name = os.path.relpath(image, self._data_dir) if self._data_dir \
+                    else os.path.basename(image)
+                name, extension = os.path.splitext(img_name)
+                image_properties = {
+                    'name': name.replace('\\', '/'),
+                    'extension': extension,
+                    'width': img.width,
+                    'height': img.height,
+                }
+                if self._meta and img_name in self._meta:
+                    image_properties['meta'] = self._meta[img_name]
+                if self._use_image_hash:
+                    image_properties['checksum'] = md5_hash(img)
+                yield image_properties
+            else:
+                yield dict()

    @property
-    def content(self):
-        return self._content
+    def range_(self):
+        return range(self._start, self._stop, self._step)
+
+    def __len__(self):
+        return len(self.range_)
+
+class Dataset3DImagesReader(DatasetImagesReader):
+    def __init__(self, **kwargs):
+        super().__init__(**kwargs)
+
+    def __iter__(self):
+        sources = (i for i in self._sources)
+        for idx in range(self._stop):
+            if idx in self.range_:
+                image = next(sources)
+                img_name = os.path.relpath(image, self._data_dir) if self._data_dir \
+                    else os.path.basename(image)
+                name, extension = os.path.splitext(img_name)
+                image_properties = {
+                    'name': name,
+                    'extension': extension,
+                }
+                if self._meta and img_name in self._meta:
+                    image_properties['meta'] = self._meta[img_name]
+                yield image_properties
+            else:
+                yield dict()

 class _Manifest:
    FILE_NAME = 'manifest.jsonl'
@ -257,6 +316,13 @@ class _Index:
    def __len__(self):
        return len(self._index)

+def _set_index(func):
+    def wrapper(self, *args, **kwargs):
+        func(self, *args,  **kwargs)
+        if self._create_index:
+            self.set_index()
+    return wrapper
+
 class _ManifestManager(ABC):
    BASE_INFORMATION = {
        'version' : 1,
@ -268,9 +334,15 @@ class _ManifestManager(ABC):
            if state.get(item, None) is None:
                raise Exception(f"Invalid '{self.manifest.name} file structure': '{item}' is required, but not found")

-    def __init__(self, path, upload_dir=None, *args, **kwargs):
+    def __init__(self, path, create_index, upload_dir=None, *args, **kwargs):
        self._manifest = _Manifest(path, upload_dir)
        self._index = _Index(os.path.dirname(self._manifest.path))
+        self._reader = None
+        self._create_index = create_index
+
+    @property
+    def reader(self):
+        return self._reader

    def _parse_line(self, line):
        """ Getting a random line from the manifest file """
@ -305,8 +377,13 @@ class _ManifestManager(ABC):
        self.reset_index()
        self.init_index()

+    def remove(self):
+        self.reset_index()
+        if os.path.exists(self.path):
+            os.remove(self.path)
+
    @abstractmethod
-    def create(self, content, **kwargs):
+    def create(self, content=None, _tqdm=None):
        pass

    @abstractmethod
@ -355,53 +432,65 @@ class _ManifestManager(ABC):
 class VideoManifestManager(_ManifestManager):
    _requared_item_attributes = {'number', 'pts'}

-    def __init__(self, manifest_path):
-        super().__init__(manifest_path)
+    def __init__(self, manifest_path, create_index=True):
+        super().__init__(manifest_path, create_index)
        setattr(self._manifest, 'TYPE', 'video')
        self.BASE_INFORMATION['properties'] = 3

-    def create(self, content, **kwargs):
-        """ Creating and saving a manifest file """
-        with open(self._manifest.path, 'w') as manifest_file:
-            base_info = {
-                'version': self._manifest.VERSION,
-                'type': self._manifest.TYPE,
-                'properties': {
-                    'name': os.path.basename(content.source_path),
-                    'resolution': content.frame_sizes,
-                    'length': content.get_size(),
-                },
-            }
-            for key, value in base_info.items():
-                json_item = json.dumps({key: value}, separators=(',', ':'))
-                manifest_file.write(f'{json_item}\n')
-
-            for item in content:
+    def link(self, media_file, upload_dir=None, chunk_size=36, force=False, only_key_frames=False, **kwargs):
+        ReaderClass = VideoStreamReader if not only_key_frames else KeyFramesVideoStreamReader
+        self._reader = ReaderClass(
+            os.path.join(upload_dir, media_file) if upload_dir else media_file,
+            chunk_size,
+            force)
+
+    def _write_base_information(self, file):
+        base_info = {
+            'version': self._manifest.VERSION,
+            'type': self._manifest.TYPE,
+            'properties': {
+                'name': os.path.basename(self._reader.source_path),
+                'resolution': self._reader.resolution,
+                'length': len(self._reader),
+            },
+        }
+        for key, value in base_info.items():
+            json_item = json.dumps({key: value}, separators=(',', ':'))
+            file.write(f'{json_item}\n')
+
+    def _write_core_part(self, file, _tqdm):
+        iterable_obj = self._reader if _tqdm is None else \
+            _tqdm(self._reader, desc="Manifest creating", total=len(self._reader))
+        for item in iterable_obj:
+            if isinstance(item, tuple):
                json_item = json.dumps({
                    'number': item[0],
                    'pts': item[1],
                    'checksum': item[2]
                }, separators=(',', ':'))
-                manifest_file.write(f"{json_item}\n")
+                file.write(f"{json_item}\n")
+
+    # pylint: disable=arguments-differ
+    @_set_index
+    def create(self, _tqdm=None):
+        """ Creating and saving a manifest file """
+        if not len(self._reader):
+            with NamedTemporaryFile(mode='w', delete=False)as tmp_file:
+                self._write_core_part(tmp_file, _tqdm)
+            temp = tmp_file.name
+            with open(self._manifest.path, 'w') as manifest_file:
+                self._write_base_information(manifest_file)
+                with open(temp, 'r') as tmp_file:
+                    manifest_file.write(tmp_file.read())
+            os.remove(temp)
+        else:
+            with open(self._manifest.path, 'w') as manifest_file:
+                self._write_base_information(manifest_file)
+                self._write_core_part(manifest_file, _tqdm)

    def partial_update(self, number, properties):
        pass

-    @staticmethod
-    def prepare_meta(media_file, upload_dir=None, chunk_size=36, force=False):
-        source_path = os.path.join(upload_dir, media_file) if upload_dir else media_file
-        meta_info = VideoStreamReader(source_path=source_path)
-        meta_info.check_type_first_frame()
-        try:
-            meta_info.validate_frames_ratio(chunk_size)
-        except AssertionError:
-            if not force:
-                raise
-        meta_info.check_video_timestamps_sequences()
-        meta_info.save_key_frames()
-        meta_info.validate_seek_key_frames()
-        return meta_info
-
    @property
    def video_name(self):
        return self['properties']['name']
@ -430,7 +519,7 @@ class ManifestValidator:

 class VideoManifestValidator(VideoManifestManager):
    def __init__(self, source_path, manifest_path):
-        self.source_path = source_path
+        self._source_path = source_path
        super().__init__(manifest_path)

    @staticmethod
@ -446,7 +535,7 @@ class VideoManifestValidator(VideoManifestManager):
                return

    def validate_seek_key_frames(self):
-        with closing(av.open(self.source_path, mode='r')) as container:
+        with closing(av.open(self._source_path, mode='r')) as container:
            video_stream = self._get_video_stream(container)
            last_key_frame = None

@ -459,7 +548,7 @@ class VideoManifestValidator(VideoManifestManager):
                last_key_frame = key_frame

    def validate_frame_numbers(self):
-        with closing(av.open(self.source_path, mode='r')) as container:
+        with closing(av.open(self._source_path, mode='r')) as container:
            video_stream = self._get_video_stream(container)
            # not all videos contain information about numbers of frames
            frames = video_stream.frames
@ -470,36 +559,44 @@ class VideoManifestValidator(VideoManifestManager):
 class ImageManifestManager(_ManifestManager):
    _requared_item_attributes = {'name', 'extension'}

-    def __init__(self, manifest_path, upload_dir=None):
-        super().__init__(manifest_path, upload_dir)
+    def __init__(self, manifest_path, upload_dir=None, create_index=True):
+        super().__init__(manifest_path, create_index, upload_dir)
        setattr(self._manifest, 'TYPE', 'images')

-    def create(self, content, **kwargs):
-        """ Creating and saving a manifest file"""
+    def link(self, **kwargs):
+        ReaderClass = DatasetImagesReader if not kwargs.get('DIM_3D', None) else Dataset3DImagesReader
+        self._reader = ReaderClass(**kwargs)
+
+    def _write_base_information(self, file):
+        base_info = {
+            'version': self._manifest.VERSION,
+            'type': self._manifest.TYPE,
+        }
+        for key, value in base_info.items():
+            json_line = json.dumps({key: value}, separators=(',', ':'))
+            file.write(f'{json_line}\n')
+
+    def _write_core_part(self, file, obj, _tqdm):
+        iterable_obj = obj if _tqdm is None else \
+            _tqdm(obj, desc="Manifest creating",
+                  total=None if not hasattr(obj, '__len__') else len(obj))
+        for image_properties in iterable_obj:
+            json_line = json.dumps({
+                key: value for key, value in image_properties.items()
+            }, separators=(',', ':'))
+            file.write(f"{json_line}\n")
+
+    @_set_index
+    def create(self, content=None, _tqdm=None):
+        """ Creating and saving a manifest file for the specialized dataset"""
        with open(self._manifest.path, 'w') as manifest_file:
-            base_info = {
-                'version': self._manifest.VERSION,
-                'type': self._manifest.TYPE,
-            }
-            for key, value in base_info.items():
-                json_item = json.dumps({key: value}, separators=(',', ':'))
-                manifest_file.write(f'{json_item}\n')
-
-            for item in content:
-                json_item = json.dumps({
-                    key: value for key, value in item.items()
-                }, separators=(',', ':'))
-                manifest_file.write(f"{json_item}\n")
+            self._write_base_information(manifest_file)
+            obj = content if content else self._reader
+            self._write_core_part(manifest_file, obj, _tqdm)

    def partial_update(self, number, properties):
        pass

-    @staticmethod
-    def prepare_meta(sources, **kwargs):
-        meta_info = DatasetImagesReader(sources=sources, **kwargs)
-        meta_info.create()
-        return meta_info
-
    @property
    def data(self):
        return (f"{image['name']}{image['extension']}" for _, image in self)
@ -512,4 +609,4 @@ class ImageManifestManager(_ManifestManager):
            'height': image['height'],
            'meta': image['meta'],
            'checksum': f"{image['checksum']}"
-        } for _, image in self if f"{image['name']}{image['extension']}" in subset_names)
+        } for _, image in self if f"{image['name']}{image['extension']}" in subset_names)
--- a/utils/dataset_manifest/create.py
+++ b/utils/dataset_manifest/create.py
@ -6,6 +6,7 @@ import os
 import sys
 import re
 from glob import glob
+from tqdm import tqdm

 from utils import detect_related_images, is_image, is_video

@ -61,17 +62,18 @@ def main():
        try:
            assert len(sources), 'A images was not found'
            manifest = ImageManifestManager(manifest_path=manifest_directory)
-            meta_info = manifest.prepare_meta(sources=sources, meta=meta, is_sorted=False,
-                use_image_hash=True, data_dir=data_dir)
-            manifest.create(meta_info)
+            manifest.link(sources=sources, meta=meta, is_sorted=False,
+                    use_image_hash=True, data_dir=data_dir)
+            manifest.create(_tqdm=tqdm)
        except Exception as ex:
            sys.exit(str(ex))
    else: # video
        try:
            assert is_video(source), 'You can specify a video path or a directory/pattern with images'
            manifest = VideoManifestManager(manifest_path=manifest_directory)
+            manifest.link(media_file=source, force=args.force)
            try:
-                meta_info = manifest.prepare_meta(media_file=source, force=args.force)
+                manifest.create(_tqdm=tqdm)
            except AssertionError as ex:
                if str(ex) == 'Too few keyframes':
                    msg = 'NOTE: prepared manifest file contains too few key frames for smooth decoding.\n' \
@ -80,7 +82,6 @@ def main():
                    sys.exit(2)
                else:
                    raise
-            manifest.create(meta_info)
        except Exception as ex:
            sys.exit(str(ex))

--- a/utils/dataset_manifest/requirements.txt
+++ b/utils/dataset_manifest/requirements.txt
@ -1,3 +1,4 @@
 av==8.0.2 --no-binary=av
 opencv-python-headless==4.4.0.42
-Pillow==7.2.0
+Pillow==7.2.0
+tqdm==4.58.0