"""Manual smoke test for loading an image-caption dataset.

Calls ``datasets.load_dataset`` with the settings below, prints the first
example of the ``train`` split, then prints the first few examples of the
``validation`` split and displays the image each one references.
"""

from itertools import islice

from datasets import load_dataset
from PIL import Image

# Settings forwarded verbatim to ``load_dataset``.
dataset_name = "image_caption_dataset.py"
dataset_config_name = "coco_2017"
cache_dir = None
keep_in_memory = False
data_dir = "./"

# How many validation examples to print and display.
NUM_VALIDATION_PREVIEWS = 5

dataset = load_dataset(
    dataset_name,
    dataset_config_name,
    cache_dir=cache_dir,
    keep_in_memory=keep_in_memory,
    data_dir=data_dir,
)

# Print only the first training example; the image is intentionally not
# displayed for this split.
for example in islice(dataset["train"], 1):
    print(example)

# Print and display the first few validation examples. ``islice`` stops
# after the requested count without pulling an extra example first.
for example in islice(dataset["validation"], NUM_VALIDATION_PREVIEWS):
    print(example)
    # NOTE(review): presumably 'image_file' holds a path readable by
    # Image.open -- confirm against the dataset loading script.
    with Image.open(example['image_file']) as image:
        image.show()