From f8bb295394f097ec5db66995c53ab304754fd3ac Mon Sep 17 00:00:00 2001
From: pegah-kh
Date: Wed, 16 Oct 2024 19:15:32 +0200
Subject: [PATCH] feature_img_folder_None

---
Reviewer notes (ignored by `git am`):
 * Purpose: let `data_args.image_folder` be None. In that case the 'image'
   entry of the sample is opened as given instead of being joined onto a
   folder (os.path.join() raises TypeError when its first argument is None).
 * `not image_folder==None` was rewritten as `image_folder is not None`.
 * The whitespace-only hunk in LazySupervisedDataset and the trailing
   developer-local rsync command appended after the `__main__` guard were
   dropped; they are unrelated to the feature.
 * NOTE(review): the hunk was edited by hand, so the post-image blob id on
   the `index` line below has not been regenerated.

 llava/train/train.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/llava/train/train.py b/llava/train/train.py
index 477c668b6..85f8e16cf 100644
--- a/llava/train/train.py
+++ b/llava/train/train.py
@@ -698,7 +698,12 @@ def __getitem__(self, i) -> Dict[str, torch.Tensor]:
             image_file = self.list_data_dict[i]['image']
             image_folder = self.data_args.image_folder
             processor = self.data_args.image_processor
-            image = Image.open(os.path.join(image_folder, image_file)).convert('RGB')
+            # image_folder may be None; image_file is then used as the path itself.
+            if image_folder is not None:
+                img_path = os.path.join(image_folder, image_file)
+            else:
+                img_path = image_file
+            image = Image.open(img_path).convert('RGB')
             if self.data_args.image_aspect_ratio == 'pad':
                 def expand2square(pil_img, background_color):
                     width, height = pil_img.size