Add ImageNetv2 to tfds

PiperOrigin-RevId: 321254456
tensorflow · Jul 14, 2020 · 5859615 · 5859615
1 parent ae9c381
commit 5859615
Show file tree

Hide file tree

Showing 37 changed files with 187 additions and 0 deletions.
diff --git a/tensorflow_datasets/image_classification/__init__.py b/tensorflow_datasets/image_classification/__init__.py
@@ -50,6 +50,7 @@
 from tensorflow_datasets.image_classification.imagenet2012_subset import Imagenet2012Subset
 from tensorflow_datasets.image_classification.imagenet_a import ImagenetA
 from tensorflow_datasets.image_classification.imagenet_resized import ImagenetResized
+from tensorflow_datasets.image_classification.imagenet_v2 import ImagenetV2
 from tensorflow_datasets.image_classification.imagenette import Imagenette
 from tensorflow_datasets.image_classification.imagewang import Imagewang
 from tensorflow_datasets.image_classification.inaturalist import INaturalist2017

diff --git a/tensorflow_datasets/image_classification/imagenet_v2.py b/tensorflow_datasets/image_classification/imagenet_v2.py
@@ -0,0 +1,147 @@
+# coding=utf-8
+# Copyright 2020 The TensorFlow Datasets Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# Lint as: python3
+"""The ImageNet-v2 image classification dataset."""
+import os
+import tensorflow.compat.v2 as tf
+import tensorflow_datasets.public_api as tfds
+
+
+# BibTeX entry passed as `citation` to `tfds.core.DatasetInfo` in `_info`.
+_CITATION = r"""
+@inproceedings{recht2019imagenet,
+  title={Do ImageNet Classifiers Generalize to ImageNet?},
+  author={Recht, Benjamin and Roelofs, Rebecca and Schmidt, Ludwig and Shankar, Vaishaal},
+  booktitle={International Conference on Machine Learning},
+  pages={5389--5400},
+  year={2019}
+}
+"""
+
+# Human-readable description, used both for every builder config and for the
+# `DatasetInfo` returned by `_info`.
+_DESCRIPTION = """
+ImageNet-v2 is an ImageNet test set (10 per class) collected by closely
+following the original labelling protocol. Each image has been labelled by
+at least 10 MTurk workers, possibly more, and depending on the strategy used to
+select which images to include among the 10 chosen for the given class there are
+three different versions of the dataset. Please refer to section four of the
+paper for more details on how the different variants were compiled.
+
+The label space is the same as that of ImageNet2012. Each example is
+represented as a dictionary with the following keys:
+
+* 'image': The image, a (H, W, 3)-tensor.
+* 'label': An integer in the range [0, 1000).
+* 'file_name': A unique string identifying the example within the dataset.
+"""
+
+# Note: Bump the version if the links change.
+_VERSION = tfds.core.Version('0.1.0')
+# Common prefix of all archive URLs below.
+_ROOT_URL = 'https://s3-us-west-2.amazonaws.com/imagenetv2public'
+# Maps each variant name to the URL of its archive. The keys double as the set
+# of valid `variant` values and as the builder config names.
+_IMAGENET_V2_URLS = {
+    'matched-frequency': _ROOT_URL + '/imagenetv2-matched-frequency.tar.gz',
+    'threshold-0.7': _ROOT_URL + '/imagenetv2-threshold0.7.tar.gz',
+    'topimages': _ROOT_URL + '/imagenetv2-topimages.tar.gz',
+}
+# Maps each variant name to the directory name that `_split_generators` joins
+# onto the extraction path to locate the images.
+_TAR_TOPDIR = {
+    'matched-frequency': 'imagenetv2-matched-frequency',
+    'threshold-0.7': 'imagenetv2-threshold0.7',
+    'topimages': 'imagenetv2-topimages',
+}
+
+# Relative path handed to `tfds.core.get_tfds_path` in `_info`; the result is
+# used as the `names_file` of the 'label' feature.
+_IMAGENET_LABELS_FILENAME = r'image_classification/imagenet2012_labels.txt'
+
+
+class ImagenetV2Config(tfds.core.BuilderConfig):
+  """Configuration specifying the variant to use."""
+
+  @tfds.core.disallow_positional_args
+  def __init__(self, variant, **kwargs):
+    """Creates the configuration for one variant of the dataset.
+
+    The dataset comes in three different variants. Please refer to the paper
+    for more details on how they were collected.
+
+    Args:
+      variant: One of 'matched-frequency', 'threshold-0.7', or 'topimages'.
+      **kwargs: Passed on to the constructor of `BuilderConfig`.
+
+    Raises:
+      ValueError: If `variant` is not a key of `_IMAGENET_V2_URLS`.
+    """
+    super(ImagenetV2Config, self).__init__(**kwargs)
+    if variant not in _IMAGENET_V2_URLS:
+      # The rejected value is a variant name, so the message says so.
+      raise ValueError('Unknown variant {}, must be one of {}'.format(
+          variant, list(_IMAGENET_V2_URLS)))
+    self.variant = variant
+
+
+def _create_builder_configs():
+  """Yields one `ImagenetV2Config` for each key of `_IMAGENET_V2_URLS`."""
+  for variant_name in _IMAGENET_V2_URLS:
+    # The variant name is reused verbatim as the config name.
+    config_kwargs = dict(
+        variant=variant_name,
+        name=variant_name,
+        version=_VERSION,
+        description=_DESCRIPTION,
+    )
+    yield ImagenetV2Config(**config_kwargs)
+
+
+class ImagenetV2(tfds.core.GeneratorBasedBuilder):
+  """An ImageNet test set recollected by following the original protocol."""
+
+  BUILDER_CONFIGS = list(_create_builder_configs())
+
+  def _info(self):
+    """Returns the `DatasetInfo` with the feature spec and metadata."""
+    label_names_path = tfds.core.get_tfds_path(_IMAGENET_LABELS_FILENAME)
+    # tfds.features.FeatureConnectors
+    feature_spec = tfds.features.FeaturesDict({
+        'image': tfds.features.Image(encoding_format='jpeg'),
+        'label': tfds.features.ClassLabel(names_file=label_names_path),
+        'file_name': tfds.features.Text(),
+    })
+    return tfds.core.DatasetInfo(
+        builder=self,
+        # This is the description that will appear on the datasets page.
+        description=_DESCRIPTION,
+        features=feature_spec,
+        # Used if as_supervised=True in builder.as_dataset.
+        supervised_keys=('image', 'label'),
+        # Homepage of the dataset for documentation
+        homepage='https://github.com/modestyachts/ImageNetV2',
+        citation=_CITATION,
+    )
+
+  def _split_generators(self, dl_manager):
+    """Returns a one-element list holding the test `SplitGenerator`.
+
+    Args:
+      dl_manager: Object whose `download_and_extract` is called with the URL
+        of the configured variant.
+    """
+    variant = self.builder_config.variant
+    archive_url = _IMAGENET_V2_URLS[variant]
+    extracted_dir = dl_manager.download_and_extract(archive_url)
+    # The images are looked up under the `_TAR_TOPDIR` entry of the variant.
+    root_dir = os.path.join(extracted_dir, _TAR_TOPDIR[variant])
+    # The dataset provides only a test split.
+    test_split = tfds.core.SplitGenerator(
+        name=tfds.Split.TEST,
+        # These kwargs will be passed to _generate_examples
+        gen_kwargs={'imagenet_v2_root': root_dir},
+    )
+    return [test_split]
+
+  def _generate_examples(self, imagenet_v2_root):
+    """Yields a `(key, example)` pair for every file under the class dirs.
+
+    Args:
+      imagenet_v2_root: Directory whose entries are listed as class
+        directories.
+
+    Yields:
+      Tuples of the image path and a dict with the keys 'image', 'label' and
+      'file_name'.
+    """
+    # The directory structure is `class_number/filename_number.jpg`, where
+    # class_number is in [0, 1000) and filename_number in [0, 10).
+    for class_name in tf.io.gfile.listdir(imagenet_v2_root):
+      class_path = os.path.join(imagenet_v2_root, class_name)
+      for basename in tf.io.gfile.listdir(class_path):
+        path = os.path.join(class_path, basename)
+        # The joined path serves as example key, image source and 'file_name'.
+        # NOTE(review): this path starts with `imagenet_v2_root`, so key and
+        # 'file_name' presumably vary with the extraction location - confirm
+        # whether a path relative to the root was intended.
+        example = {
+            'image': path,
+            'label': int(class_name),
+            'file_name': path,
+        }
+        yield path, example
diff --git a/tensorflow_datasets/image_classification/imagenet_v2_test.py b/tensorflow_datasets/image_classification/imagenet_v2_test.py
@@ -0,0 +1,36 @@
+# coding=utf-8
+# Copyright 2020 The TensorFlow Datasets Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# Lint as: python3
+from tensorflow_datasets.image_classification import imagenet_v2
+import tensorflow_datasets.public_api as tfds
+
+
+class ImagenetV2Test(tfds.testing.DatasetBuilderTestCase):
+  """Dataset builder test case covering all three ImageNet-v2 configs."""
+
+  DATASET_CLASS = imagenet_v2.ImagenetV2
+  BUILDER_CONFIG_NAMES_TO_TEST = [
+      'matched-frequency',
+      'threshold-0.7',
+      'topimages',
+  ]
+  # Number of fake test examples.
+  SPLITS = {'test': 10}
+
+  # NOTE(review): presumably makes the mocked extraction resolve to the fake
+  # examples directory itself, so `_TAR_TOPDIR` is joined onto it - confirm
+  # against `tfds.testing.DatasetBuilderTestCase`.
+  DL_EXTRACT_RESULT = ''
+
+
+# Run the tests only when this file is executed as a script.
+if __name__ == '__main__':
+  tfds.testing.test_main()
diff --git a/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/3.jpeg b/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/3.jpeg
diff --git a/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/4.jpeg b/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/4.jpeg
diff --git a/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/5.jpeg b/tensorflow_datasets/testing/test_data/fake_examples/imagenet_v2/125/5.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/3.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/3.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/4.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/4.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/5.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/125/5.jpeg
diff --git a/...ting/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/42/1.jpeg b/...ting/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/42/1.jpeg
diff --git a/...ting/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/42/2.jpeg b/...ting/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/42/2.jpeg
diff --git a/...ng/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/10.jpeg b/...ng/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/10.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/6.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/6.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/7.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/7.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/8.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/8.jpeg
diff --git a/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/9.jpeg b/...ing/test_data/fake_examples/imagenet_v2/imagenetv2-matched-frequency/999/9.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/3.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/3.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/4.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/4.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/5.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/125/5.jpeg
diff --git a/...s/testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/42/1.jpeg b/...s/testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/42/1.jpeg
diff --git a/...s/testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/42/2.jpeg b/...s/testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/42/2.jpeg
diff --git a/...testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/10.jpeg b/...testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/10.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/6.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/6.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/7.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/7.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/8.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/8.jpeg
diff --git a/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/9.jpeg b/.../testing/test_data/fake_examples/imagenet_v2/imagenetv2-threshold0.7/999/9.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/3.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/3.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/4.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/4.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/5.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/125/5.jpeg
diff --git a/...sets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/42/1.jpeg b/...sets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/42/1.jpeg
diff --git a/...sets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/42/2.jpeg b/...sets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/42/2.jpeg
diff --git a/...ts/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/10.jpeg b/...ts/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/10.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/6.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/6.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/7.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/7.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/8.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/8.jpeg
diff --git a/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/9.jpeg b/...ets/testing/test_data/fake_examples/imagenet_v2/imagenetv2-topimages/999/9.jpeg
diff --git a/tensorflow_datasets/url_checksums/imagenet_v2.txt b/tensorflow_datasets/url_checksums/imagenet_v2.txt
@@ -0,0 +1,3 @@
+https://s3-us-west-2.amazonaws.com/imagenetv2public/imagenetv2-matched-frequency.tar.gz 610406400 74c5e7f40cec17ff19a074812dd08ebb0af43bca62ea85e0bc242941ea06372d
+https://s3-us-west-2.amazonaws.com/imagenetv2public/imagenetv2-threshold0.7.tar.gz 605399040 bf2e2d9b625ae29c6e44982928f36220af62359b74602a995518a06840d0d76e
+https://s3-us-west-2.amazonaws.com/imagenetv2public/imagenetv2-topimages.tar.gz 606351360 1ced1ef684934a84af854658bc8ff9adbbec553631e6eef3535ef816c3d3b98f