Skip to content

Addresses #145; based on @fmassa's #526

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Closed
wants to merge 1 commit into from
Closed
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
73 changes: 48 additions & 25 deletions torchvision/datasets/folder.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,29 +32,6 @@ def is_image_file(filename):
return has_file_allowed_extension(filename, IMG_EXTENSIONS)


def find_classes(dir):
    """Find the class sub-directories located directly under ``dir``.

    Args:
        dir (string): Root directory path.

    Returns:
        tuple: (classes, class_to_idx) where classes is the sorted list of
            sub-directory names and class_to_idx maps each name to its
            position in that list.
    """
    # Only directories count as classes; plain files in the root are ignored.
    classes = sorted(
        entry for entry in os.listdir(dir)
        if os.path.isdir(os.path.join(dir, entry))
    )
    class_to_idx = {name: index for index, name in enumerate(classes)}
    return classes, class_to_idx


def make_dataset(dir, class_to_idx, extensions):
    """Collect (path, class index) pairs for every accepted file under ``dir``.

    Each directory directly under ``dir`` is treated as one class and is
    walked recursively; entries of ``dir`` that are not directories are
    skipped. A file is kept when ``has_file_allowed_extension`` accepts its
    name for ``extensions``.

    Args:
        dir (string): Root directory path ("~" is expanded).
        class_to_idx (dictionary): Mapping of class directory name to index.
        extensions (list): Extensions passed to has_file_allowed_extension.

    Returns:
        list: (path, target) tuples, visited in sorted order at every level.
    """
    dir = os.path.expanduser(dir)
    images = []
    for target in sorted(os.listdir(dir)):
        class_dir = os.path.join(dir, target)
        if os.path.isdir(class_dir):
            # Sorting the walk output keeps the sample order deterministic.
            for root, _, fnames in sorted(os.walk(class_dir)):
                images.extend(
                    (os.path.join(root, fname), class_to_idx[target])
                    for fname in sorted(fnames)
                    if has_file_allowed_extension(fname, extensions)
                )
    return images


class DatasetFolder(data.Dataset):
Expand Down Expand Up @@ -86,8 +63,8 @@ class DatasetFolder(data.Dataset):
"""

def __init__(self, root, loader, extensions, transform=None, target_transform=None):
classes, class_to_idx = find_classes(root)
samples = make_dataset(root, class_to_idx, extensions)
classes, class_to_idx = self._find_classes(root)
samples = self._make_dataset(root, class_to_idx, extensions)
if len(samples) == 0:
raise(RuntimeError("Found 0 files in subfolders of: " + root + "\n"
"Supported extensions are: " + ",".join(extensions)))
Expand All @@ -104,6 +81,52 @@ def __init__(self, root, loader, extensions, transform=None, target_transform=No
self.transform = transform
self.target_transform = target_transform

def _find_classes(self, dir):
    """
    Finds the classes in a dataset directory.

    Declared as an instance method (taking ``self``) because ``__init__``
    invokes it as ``self._find_classes(root)``; without ``self`` that bound
    call raises TypeError.

    Args:
        dir (string): Root directory path.

    Returns:
        tuple: (classes, class_to_idx) where classes is the sorted list of
            sub-directory names found directly under ``dir`` and
            class_to_idx is a dictionary mapping each name to its index.
    """
    # Only directories count as classes; plain files in the root are ignored.
    classes = sorted(d for d in os.listdir(dir) if os.path.isdir(os.path.join(dir, d)))
    class_to_idx = {name: idx for idx, name in enumerate(classes)}
    return classes, class_to_idx


def _make_dataset(self, dir, class_to_idx, extensions):
    """
    A generic method for obtaining paths to all data files.

    Declared as an instance method (taking ``self``) because ``__init__``
    invokes it as ``self._make_dataset(root, class_to_idx, extensions)``;
    without ``self`` that bound call raises TypeError.

    Each directory directly under ``dir`` is treated as one class and is
    walked recursively; entries of ``dir`` that are not directories are
    skipped.

    Args:
        dir (string): Root directory path ("~" is expanded).
        class_to_idx (dictionary): A mapping of class names to ids.
        extensions (list): A list of permitted data file extensions.

    Returns:
        images: A list of (path, target) per data file.
    """
    images = []
    dir = os.path.expanduser(dir)
    for target in sorted(os.listdir(dir)):
        class_dir = os.path.join(dir, target)
        if not os.path.isdir(class_dir):
            continue

        # Sorting the walk output keeps the sample order deterministic.
        for root, _, fnames in sorted(os.walk(class_dir)):
            for fname in sorted(fnames):
                if has_file_allowed_extension(fname, extensions):
                    path = os.path.join(root, fname)
                    images.append((path, class_to_idx[target]))

    return images


def __getitem__(self, index):
"""
Args:
Expand Down