You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
150 lines
5.9 KiB
Python
150 lines
5.9 KiB
Python
# Copyright (C) 2019 Intel Corporation
|
|
#
|
|
# SPDX-License-Identifier: MIT
|
|
|
|
import math
|
|
from io import BytesIO
|
|
from enum import Enum
|
|
|
|
import numpy as np
|
|
from PIL import Image
|
|
|
|
from cvat.apps.engine.media_extractors import VideoReader, ZipReader
|
|
from cvat.apps.engine.models import DataChoice
|
|
from cvat.apps.engine.mime_types import mimetypes
|
|
|
|
|
|
class FrameProvider():
    """Give access to the frames and chunks stored for a ``db_data`` object.

    Data is stored as chunks of ``db_data.chunk_size`` frames in two
    variants, selected by ``Quality``. Frame ``n`` lives in chunk
    ``n // chunk_size`` at offset ``n % chunk_size``.

    The provider remembers the last chunk reader opened for each quality so
    that consecutive ``get_frame`` calls hitting the same chunk reuse it.
    """

    class Quality(Enum):
        # Selects which of the two stored chunk variants is read.
        COMPRESSED = 0
        ORIGINAL = 100

    class Type(Enum):
        # Representation of the frames yielded by get_frames().
        BUFFER = 0
        PIL = 1
        NUMPY_ARRAY = 2

    def __init__(self, db_data):
        """Pick a reader class per quality based on the stored chunk types.

        Args:
            db_data: object exposing ``size``, ``chunk_size``,
                ``compressed_chunk_type``, ``original_chunk_type`` and the
                ``get_*_path`` accessors used by this class.

        Raises:
            Exception: if either chunk type is neither ``DataChoice.IMAGESET``
                nor ``DataChoice.VIDEO``.
        """
        self._db_data = db_data

        self._compressed_chunk_reader_class = self._select_reader_class(
            db_data.compressed_chunk_type)
        self._original_chunk_reader_class = self._select_reader_class(
            db_data.original_chunk_type)

        # Per-quality cache: number of the chunk currently opened and its reader.
        self._extracted_compressed_chunk = None
        self._compressed_chunk_reader = None
        self._extracted_original_chunk = None
        self._original_chunk_reader = None

    def __len__(self):
        """Return the number of frames (``db_data.size``)."""
        return self._db_data.size

    @staticmethod
    def _select_reader_class(chunk_type):
        """Map a ``DataChoice`` chunk type to the reader class that opens it."""
        if chunk_type == DataChoice.IMAGESET:
            return ZipReader
        if chunk_type == DataChoice.VIDEO:
            return VideoReader
        raise Exception('Unsupported chunk type')

    def _chunk_count(self):
        """Return how many chunks are needed to hold ``size`` frames."""
        return math.ceil(self._db_data.size / self._db_data.chunk_size)

    def _validate_frame_number(self, frame_number):
        """Check a frame number and locate it inside the chunk layout.

        Returns:
            Tuple ``(frame_number, chunk_number, frame_offset)`` of ints.

        Raises:
            Exception: if the number is outside ``[0, size)``.
        """
        frame_number_ = int(frame_number)
        if frame_number_ < 0 or frame_number_ >= self._db_data.size:
            raise Exception('Incorrect requested frame number: {}'.format(frame_number_))

        chunk_number, frame_offset = divmod(frame_number_, self._db_data.chunk_size)
        return frame_number_, chunk_number, frame_offset

    def _validate_chunk_number(self, chunk_number):
        """Return ``chunk_number`` as int, raising if no such chunk exists."""
        chunk_number_ = int(chunk_number)
        if chunk_number_ < 0 or chunk_number_ >= self._chunk_count():
            raise Exception('requested chunk does not exist')

        return chunk_number_

    @staticmethod
    def _av_frame_to_png_bytes(av_frame):
        """Encode a decoded video frame as PNG into a rewound ``BytesIO``.

        ``av_frame`` must provide ``to_image()`` returning an object with a
        PIL-style ``save(buf, format=...)`` method.
        """
        pil_img = av_frame.to_image()
        buf = BytesIO()
        pil_img.save(buf, format='PNG')
        buf.seek(0)
        return buf

    def _store_chunk_reader(self, quality, chunk_number, chunk_reader):
        """Remember the reader opened for ``quality`` so later calls reuse it.

        Any ``quality`` other than the two ``Quality`` members is ignored.
        """
        if quality == self.Quality.ORIGINAL:
            self._extracted_original_chunk = chunk_number
            self._original_chunk_reader = chunk_reader
        elif quality == self.Quality.COMPRESSED:
            self._extracted_compressed_chunk = chunk_number
            self._compressed_chunk_reader = chunk_reader

    def _get_frame(self, frame_number, chunk_path_getter, extracted_chunk,
            chunk_reader, reader_class, quality=None):
        """Read one frame, reusing ``chunk_reader`` when it covers the frame.

        Args:
            frame_number: requested frame index.
            chunk_path_getter: callable mapping a chunk number to its path.
            extracted_chunk: number of the chunk ``chunk_reader`` was opened
                for, or ``None``.
            chunk_reader: previously opened reader, or ``None``.
            reader_class: class used to open a chunk (called with a
                one-element list holding the chunk path).
            quality: when given, a newly opened reader is stored in the
                cache attributes of that quality. Previously the cache was
                never written, so every call reopened the chunk.

        Returns:
            Tuple ``(frame, mime_type)``. Video frames are re-encoded to PNG.

        Raises:
            Exception: if ``frame_number`` is out of range.
        """
        _, chunk_number, frame_offset = self._validate_frame_number(frame_number)

        if chunk_reader is None or chunk_number != extracted_chunk:
            chunk_reader = reader_class([chunk_path_getter(chunk_number)])
            self._store_chunk_reader(quality, chunk_number, chunk_reader)

        frame, frame_name = chunk_reader[frame_offset]
        if reader_class is VideoReader:
            return (self._av_frame_to_png_bytes(frame), 'image/png')

        # guess_type() yields (type, encoding); return only the MIME string so
        # both branches hand back the same shape.
        # NOTE(review): assumes the project `mimetypes` object follows the
        # stdlib guess_type() contract - confirm.
        return (frame, mimetypes.guess_type(frame_name)[0])

    def _convert_frame(self, frame, reader_class, out_type):
        """Convert a frame produced by ``reader_class`` to ``out_type``.

        Raises:
            Exception: if ``out_type`` is not a ``Type`` member.
        """
        if out_type == self.Type.BUFFER:
            return self._av_frame_to_png_bytes(frame) if reader_class is VideoReader else frame

        if out_type == self.Type.PIL:
            return frame.to_image() if reader_class is VideoReader else Image.open(frame)

        if out_type == self.Type.NUMPY_ARRAY:
            if reader_class is VideoReader:
                image = np.array(frame.to_image())
            else:
                image = np.array(Image.open(frame))
            # Only 3- and 4-channel images are reordered; a 4th channel is kept as is.
            if len(image.shape) == 3 and image.shape[2] in {3, 4}:
                image[:, :, :3] = image[:, :, 2::-1] # RGB to BGR
            return image

        raise Exception('unsupported output type')

    def _get_frames(self, chunk_path_getter, reader_class, out_type):
        """Yield every frame, chunk by chunk, converted to ``out_type``.

        This is a generator: chunks are opened, and an unsupported
        ``out_type`` is reported, only once iteration starts.
        """
        for chunk_idx in range(self._chunk_count()):
            chunk_reader = reader_class([chunk_path_getter(chunk_idx)])
            for frame, _ in chunk_reader:
                yield self._convert_frame(frame, reader_class, out_type)

    def get_preview(self):
        """Return ``db_data.get_preview_path()``."""
        return self._db_data.get_preview_path()

    def get_chunk(self, chunk_number, quality=Quality.ORIGINAL):
        """Return the path of chunk ``chunk_number`` in the given quality.

        Raises:
            Exception: if the chunk does not exist or ``quality`` is not a
                ``Quality`` member.
        """
        chunk_number = self._validate_chunk_number(chunk_number)
        if quality == self.Quality.ORIGINAL:
            return self._db_data.get_original_chunk_path(chunk_number)
        if quality == self.Quality.COMPRESSED:
            return self._db_data.get_compressed_chunk_path(chunk_number)

        # Fail loudly instead of silently returning None.
        raise Exception('unsupported quality')

    def get_frame(self, frame_number, quality=Quality.ORIGINAL):
        """Return ``(frame, mime_type)`` for one frame in the given quality.

        Raises:
            Exception: if ``frame_number`` is out of range or ``quality`` is
                not a ``Quality`` member.
        """
        if quality == self.Quality.ORIGINAL:
            return self._get_frame(
                frame_number=frame_number,
                chunk_path_getter=self._db_data.get_original_chunk_path,
                extracted_chunk=self._extracted_original_chunk,
                chunk_reader=self._original_chunk_reader,
                reader_class=self._original_chunk_reader_class,
                quality=quality,
            )
        if quality == self.Quality.COMPRESSED:
            return self._get_frame(
                frame_number=frame_number,
                chunk_path_getter=self._db_data.get_compressed_chunk_path,
                extracted_chunk=self._extracted_compressed_chunk,
                chunk_reader=self._compressed_chunk_reader,
                reader_class=self._compressed_chunk_reader_class,
                quality=quality,
            )

        raise Exception('unsupported quality')

    def get_frames(self, quality=Quality.ORIGINAL, out_type=Type.BUFFER):
        """Return a generator over all frames in the given quality.

        Raises:
            Exception: immediately if ``quality`` is not a ``Quality``
                member; during iteration if ``out_type`` is unsupported.
        """
        if quality == self.Quality.ORIGINAL:
            return self._get_frames(
                chunk_path_getter=self._db_data.get_original_chunk_path,
                reader_class=self._original_chunk_reader_class,
                out_type=out_type,
            )
        if quality == self.Quality.COMPRESSED:
            return self._get_frames(
                chunk_path_getter=self._db_data.get_compressed_chunk_path,
                reader_class=self._compressed_chunk_reader_class,
                out_type=out_type,
            )

        raise Exception('unsupported quality')
|