fix: check if the voc dataset folder exists before downloading. #9129


Closed · wants to merge 3 commits
28 changes: 22 additions & 6 deletions torchvision/datasets/voc.py
@@ -1,7 +1,7 @@
 import collections
 import os
 from pathlib import Path
-from typing import Any, Callable, Optional, Union
+from typing import Any, Callable, Optional, Tuple, Union
 from xml.etree.ElementTree import Element as ET_Element
 
 try:
@@ -64,6 +64,8 @@ class _VOCBase(VisionDataset):
     _SPLITS_DIR: str
     _TARGET_DIR: str
     _TARGET_FILE_EXT: str
+    _IMAGE_SET: str = "ImageSets"
+    _IMAGE_DIR: str = "JPEGImages"
 
     def __init__(
         self,
@@ -95,24 +97,38 @@ def __init__(
         voc_root = os.path.join(self.root, base_dir)
 
         if download:
-            download_and_extract_archive(self.url, self.root, filename=self.filename, md5=self.md5)
+            self._download(voc_root)
 
-        if not os.path.isdir(voc_root):
+        if not self._check_exists(voc_root):
             raise RuntimeError("Dataset not found or corrupted. You can use download=True to download it")
 
-        splits_dir = os.path.join(voc_root, "ImageSets", self._SPLITS_DIR)
+        splits_dir, image_dir, target_dir = self._voc_subfolders(voc_root)
         split_f = os.path.join(splits_dir, image_set.rstrip("\n") + ".txt")
         with open(os.path.join(split_f)) as f:
             file_names = [x.strip() for x in f.readlines()]
 
-        image_dir = os.path.join(voc_root, "JPEGImages")
         self.images = [os.path.join(image_dir, x + ".jpg") for x in file_names]
 
-        target_dir = os.path.join(voc_root, self._TARGET_DIR)
         self.targets = [os.path.join(target_dir, x + self._TARGET_FILE_EXT) for x in file_names]
 
         assert len(self.images) == len(self.targets)
 
+    def _voc_subfolders(self, voc_root) -> Tuple[str, str, str]:
+        """Returns the subfolders for the VOC dataset."""
+        splits_dir = os.path.join(voc_root, self._IMAGE_SET, self._SPLITS_DIR)
+        image_dir = os.path.join(voc_root, self._IMAGE_DIR)
+        target_dir = os.path.join(voc_root, self._TARGET_DIR)
+        return splits_dir, image_dir, target_dir
+
+    def _download(self, voc_root: str) -> None:
+        if self._check_exists(voc_root):
+            return
+        download_and_extract_archive(self.url, self.root, filename=self.filename, md5=self.md5)

Contributor:

I'm actually a little confused, as download_and_extract_archive() calls download_url(), which already does an existence check:

# check if file is already present locally
if check_integrity(fpath, md5):
    return

That is, my reading of the code suggests that the current code should already avoid re-downloading the files. If it does not, then we may have a bug where we're not passing the right arguments to the utility functions, and we should fix that instead of implementing a new kind of existence check.
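
The short-circuit is easy to observe with the utility directly (a sketch; the archive path is hypothetical, and passing md5=None reduces check_integrity to a plain existence test):

from torchvision.datasets.utils import check_integrity

# download_url() runs this same check before opening any connection: a hit on
# an intact local file means no new download is started.
archive = "./data/VOCtrainval_11-May-2012.tar"  # hypothetical local path
if check_integrity(archive, md5=None):
    print("archive already present; download_url() would return early")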

The current existence check does compute an MD5 sum over the whole downloaded file, and that might also be expensive, but I wouldn't expect it to take the 8 minutes the user reported in #9059:

def calculate_md5(fpath: Union[str, pathlib.Path], chunk_size: int = 1024 * 1024) -> str:
    # Setting the `usedforsecurity` flag does not change anything about the functionality, but indicates that we are
    # not using the MD5 checksum for cryptography. This enables its usage in restricted environments like FIPS. Without
    # it torchvision.datasets is unusable in these environments since we perform a MD5 check everywhere.
    md5 = hashlib.md5(usedforsecurity=False)
    with open(fpath, "rb") as f:
        while chunk := f.read(chunk_size):
            md5.update(chunk)
    return md5.hexdigest()
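
If the MD5 pass were the bottleneck, it is easy to time directly (a sketch; the archive path is hypothetical):

import time
from torchvision.datasets.utils import calculate_md5

archive = "./data/VOCtrainval_11-May-2012.tar"  # hypothetical local copy
start = time.monotonic()
digest = calculate_md5(archive)  # streams the file in 1 MiB chunks
print(f"md5 {digest} computed in {time.monotonic() - start:.1f}s")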

Contributor Author:

Yes!! I hadn't noticed the internal download mechanism, and your conclusion from the code reading is correct. After testing locally, I can confirm that the check_integrity function does return early before starting a new download session. My bad for being sloppy about re-validating the issue.

Perhaps we could close this PR for now and check if the issue reappears in the future?
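
For reference, the behavior can be re-validated end to end with something like this (a sketch; the "./data" root is hypothetical):

from torchvision.datasets import VOCSegmentation

# First call downloads and extracts the ~2 GB archive.
ds = VOCSegmentation("./data", year="2012", image_set="train", download=True)
# Second call: download_url() finds the intact archive via check_integrity()
# and returns early, so no new download is started.
ds = VOCSegmentation("./data", year="2012", image_set="train", download=True)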

Contributor:

@GdoongMathew, no worries, I also had assumed there must be a problem! I agree with closing this PR and seeing if the issue comes up again.


+    def _check_exists(self, voc_root: str) -> bool:
+        """Check if the dataset exists."""
+        return all(os.path.isdir(d) and len(os.listdir(d)) for d in self._voc_subfolders(voc_root))
 
     def __len__(self) -> int:
         return len(self.images)
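
For context, the new _check_exists amounts to the following for VOCSegmentation with year="2012" (a sketch; the "data" root is hypothetical and the folder names assume the standard VOCdevkit layout):

import os

# Mirrors _voc_subfolders() / _check_exists() for VOCSegmentation, year="2012":
# each subfolder must exist and be non-empty for the dataset to count as present.
voc_root = os.path.join("data", "VOCdevkit", "VOC2012")
subfolders = (
    os.path.join(voc_root, "ImageSets", "Segmentation"),  # splits_dir
    os.path.join(voc_root, "JPEGImages"),                  # image_dir
    os.path.join(voc_root, "SegmentationClass"),           # target_dir
)
print("dataset present:", all(os.path.isdir(d) and len(os.listdir(d)) for d in subfolders))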
