Source code for compressai.datasets.vimeo90k
# Copyright (c) 2021-2024, InterDigital Communications, Inc
# All rights reserved.
# Redistribution and use in source and binary forms, with or without
# modification, are permitted (subject to the limitations in the disclaimer
# below) provided that the following conditions are met:
# * Redistributions of source code must retain the above copyright notice,
# this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright notice,
# this list of conditions and the following disclaimer in the documentation
# and/or other materials provided with the distribution.
# * Neither the name of InterDigital Communications, Inc nor the names of its
# contributors may be used to endorse or promote products derived from this
# software without specific prior written permission.
# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE GRANTED BY
# THIS LICENSE. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
# CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT
# NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
# PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
# OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
# OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
# ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
from pathlib import Path
from PIL import Image
from torch.utils.data import Dataset
from compressai.registry import register_dataset
[docs]
@register_dataset("Vimeo90kDataset")
class Vimeo90kDataset(Dataset):
"""Load a Vimeo-90K structured dataset.
Vimeo-90K dataset from
Tianfan Xue, Baian Chen, Jiajun Wu, Donglai Wei, William T. Freeman:
`"Video Enhancement with Task-Oriented Flow"
<https://arxiv.org/abs/1711.09078>`_,
International Journal of Computer Vision (IJCV), 2019.
Training and testing image samples are respectively stored in
separate directories:
.. code-block::
- rootdir/
- sequence/
- 00001/001/im1.png
- 00001/001/im2.png
- 00001/001/im3.png
Args:
root (string): root directory of the dataset
transform (callable, optional): a function or transform that takes in a
PIL image and returns a transformed version
split (string): split mode ('train' or 'valid')
tuplet (int): order of dataset tuplet (e.g. 3 for "triplet" dataset)
"""
def __init__(self, root, transform=None, split="train", tuplet=3):
list_path = Path(root) / self._list_filename(split, tuplet)
with open(list_path) as f:
self.samples = [
f"{root}/sequences/{line.rstrip()}/im{idx}.png"
for line in f
if line.strip() != ""
for idx in range(1, tuplet + 1)
]
self.transform = transform
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
img: `PIL.Image.Image` or transformed `PIL.Image.Image`.
"""
img = Image.open(self.samples[index]).convert("RGB")
if self.transform:
return self.transform(img)
return img
def __len__(self):
return len(self.samples)
def _list_filename(self, split: str, tuplet: int) -> str:
tuplet_prefix = {3: "tri", 7: "sep"}[tuplet]
list_suffix = {"train": "trainlist", "valid": "testlist"}[split]
return f"{tuplet_prefix}_{list_suffix}.txt"