Skip to content

Commit c73db6e

Browse files
tomvdw authored and The TensorFlow Datasets Authors committed
Use webvid folder inside of manual dir
PiperOrigin-RevId: 520600362
1 parent 72ec6e0 commit c73db6e

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

tensorflow_datasets/datasets/webvid/webvid_dataset_builder.py

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -135,7 +135,8 @@ class Builder(tfds.core.GeneratorBasedBuilder):
135135
MANUAL_DOWNLOAD_INSTRUCTIONS = """
136136
Follow the download instructions in https://m-bain.github.io/webvid-dataset/
137137
to get the data. Place the csv files and the video directories in
138-
`manual_dir/`, such that mp4 files are placed in `manual_dir/*/*_*/*.mp4`.
138+
`manual_dir/webvid`, such that mp4 files are placed in
139+
`manual_dir/webvid/*/*_*/*.mp4`.
139140
140141
First directory typically being an arbitrary part directory (for sharded
141142
downloading), second directory is the page directory (two numbers around
@@ -218,7 +219,10 @@ def _split_generators(self, dl_manager: tfds.download.DownloadManager):
218219
def get_captions_path(glob):
219220
paths = list(epath.Path(dl_manager.manual_dir).glob(glob))
220221
if len(paths) != 1:
221-
raise ValueError(f'Invalid amount of glob results in {paths}.')
222+
raise ValueError(
223+
f'Invalid amount of glob results in {paths} for'
224+
f' {dl_manager.manual_dir}/{glob}.'
225+
)
222226
return paths[0]
223227

224228
return {

0 commit comments

Comments
 (0)