Skip to content

Commit 813b5d2

Browse files
Merge pull request #701 from ChanchalKumarMaji:read-from-archive
PiperOrigin-RevId: 255552399
2 parents 041b65e + 1caadb8 commit 813b5d2

File tree

12 files changed

+14 −24 lines changed

tensorflow_datasets/image/downsampled_imagenet.py

Lines changed: 10 additions & 20 deletions
Original file line number | Diff line number | Diff line change
@@ -19,10 +19,6 @@
 19  19   from __future__ import division
 20  20   from __future__ import print_function
 21  21
 22     - import os
 23     -
 24     - import tensorflow as tf
 25     -
 26  22   from tensorflow_datasets.core import api_utils
 27  23   import tensorflow_datasets.public_api as tfds
 28  24
@@ -107,38 +103,32 @@ def _split_generators(self, dl_manager):
107 103       train_url = _DL_URL + "train_" + self.builder_config.name + ".tar"
108 104       valid_url = _DL_URL + "valid_" + self.builder_config.name + ".tar"
109 105
110     -     extracted_paths = dl_manager.download_and_extract({
111     -         "train_images": train_url,
112     -         "valid_images": valid_url,
113     -     })
    106 +     train_path, valid_path = dl_manager.download([
    107 +         train_url,
    108 +         valid_url,
    109 +     ])
114 110
115 111       return [
116 112           tfds.core.SplitGenerator(
117 113               name=tfds.Split.TRAIN,
118 114               num_shards=10,
119 115               gen_kwargs={
120     -                 "path":
121     -                     os.path.join(extracted_paths["train_images"],
122     -                                  "train_" + self.builder_config.name),
    116 +                 "archive": dl_manager.iter_archive(train_path),
123 117               }),
124 118           tfds.core.SplitGenerator(
125 119               name=tfds.Split.VALIDATION,
126 120               num_shards=1,
127 121               gen_kwargs={
128     -                 "path":
129     -                     os.path.join(extracted_paths["valid_images"],
130     -                                  "valid_" + self.builder_config.name),
    122 +                 "archive": dl_manager.iter_archive(valid_path),
131 123               }),
132 124       ]
133 125
134     -   def _generate_examples(self, path):
135     -     images = tf.io.gfile.listdir(path)
136     -
137     -     for image in images:
    126 +   def _generate_examples(self, archive):
    127 +     for fname, fobj in archive:
138 128         record = {
139     -           "image": os.path.join(path, image),
    129 +           "image": fobj,
140 130         }
141 131         if self.version.implements(tfds.core.Experiment.S3):
142     -         yield image, record
    132 +         yield fname, record
143 133         else:
144 134           yield record

tensorflow_datasets/image/downsampled_imagenet_test.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -34,10 +34,10 @@ class DownsampledImagenetTest(testing.DatasetBuilderTestCase):
 34  34         tfds.Split.VALIDATION: 2,
 35  35     }
 36  36
 37     -   DL_EXTRACT_RESULT = {
 38     -       "train_images": "train_images",
 39     -       "valid_images": "valid_images",
 40     -   }
     37 +   DL_EXTRACT_RESULT = [
     38 +       "train_32x32.tar",
     39 +       "valid_32x32.tar",
     40 +   ]
 41  41
 42  42
 43  43   class DownsampledImagenetS3Test(DownsampledImagenetTest):

0 commit comments

Comments
 (0)