From a2e5639fc7d3586d2f5878c7cb5fc93a16fa905e Mon Sep 17 00:00:00 2001 From: Pierre Colle Date: Sat, 17 Feb 2024 07:29:26 +0100 Subject: [PATCH] fix new hf dataset --- .../remote/scheduled/finetune-color-palette-mlp-unweighted.toml | 2 -- .../remote/scheduled/finetune-color-palette-mlp-weighted.toml | 2 -- src/refiners/training_utils/huggingface_datasets.py | 2 +- 3 files changed, 1 insertion(+), 5 deletions(-) diff --git a/configs/remote/scheduled/finetune-color-palette-mlp-unweighted.toml b/configs/remote/scheduled/finetune-color-palette-mlp-unweighted.toml index 750dffd95..06dc844fb 100644 --- a/configs/remote/scheduled/finetune-color-palette-mlp-unweighted.toml +++ b/configs/remote/scheduled/finetune-color-palette-mlp-unweighted.toml @@ -60,7 +60,6 @@ use_gyro_dropout = false hf_repo = "refiners/unsplash-25k-cogvlm-captions" revision = "main" resize_image_max_size = 512 -caption_key = "ai_description" split = "train[200:]" [checkpointing] @@ -71,7 +70,6 @@ use_wandb = true hf_repo = "refiners/unsplash-25k-cogvlm-captions" revision = "main" resize_image_max_size = 512 -caption_key = "ai_description" split = "train[:20]" [evaluation] diff --git a/configs/remote/scheduled/finetune-color-palette-mlp-weighted.toml b/configs/remote/scheduled/finetune-color-palette-mlp-weighted.toml index c485bc27a..1d103f87a 100644 --- a/configs/remote/scheduled/finetune-color-palette-mlp-weighted.toml +++ b/configs/remote/scheduled/finetune-color-palette-mlp-weighted.toml @@ -60,7 +60,6 @@ use_gyro_dropout = false hf_repo = "refiners/unsplash-25k-cogvlm-captions" revision = "main" resize_image_max_size = 512 -caption_key = "ai_description" split = "train[200:]" [checkpointing] @@ -71,7 +70,6 @@ use_wandb = true hf_repo = "refiners/unsplash-25k-cogvlm-captions" revision = "main" resize_image_max_size = 512 -caption_key = "ai_description" split = "train[:20]" [evaluation] diff --git a/src/refiners/training_utils/huggingface_datasets.py b/src/refiners/training_utils/huggingface_datasets.py index 9820371cf..fda1e1616 100644 --- a/src/refiners/training_utils/huggingface_datasets.py +++ b/src/refiners/training_utils/huggingface_datasets.py @@ -29,7 +29,7 @@ def load_hf_dataset( dataset = dataset.map( function=download_image, - input_columns=["url"], + input_columns=["photo_image_url"], fn_kwargs={ "dl_manager": DownloadManager(), },