---
dataset_info:
  features:
  - name: image
    dtype: image
  - name: text
    dtype: string
  - name: source
    dtype: string
  - name: filename
    dtype: string
  - name: type
    dtype: string
  splits:
  - name: train
    num_bytes: 35238980155.59
    num_examples: 454457
  download_size: 35201347836
  dataset_size: 35238980155.59
configs:
- config_name: default
  data_files:
  - split: train
    path: data/train-*
license: mit
task_categories:
- image-to-text
language:
- la
- fr
- it
- es
- ca
- pt
- cs
- nl
- de
size_categories:
- 100K<n<1M