From 8d6e5d54163f97179c1e48adfd6bcb6942373e60 Mon Sep 17 00:00:00 2001 From: YunyaoZhou Date: Tue, 7 Jan 2025 22:40:36 +0800 Subject: [PATCH] =?UTF-8?q?feat=E2=9C=A8:=20=E5=A2=9E=E5=8A=A0=E5=9B=BE?= =?UTF-8?q?=E5=83=8F=E5=B0=BA=E5=AF=B8=E8=B0=83=E6=95=B4=E9=80=BB=E8=BE=91?= =?UTF-8?q?=E4=BB=A5=E6=94=AF=E6=8C=81=E5=B0=8F=E4=BA=8E28=E7=9A=84?= =?UTF-8?q?=E5=AE=BD=E9=AB=98?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/dataset_library/OCRVQADataset.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/src/dataset_library/OCRVQADataset.py b/src/dataset_library/OCRVQADataset.py index 415c3fc..58043c9 100644 --- a/src/dataset_library/OCRVQADataset.py +++ b/src/dataset_library/OCRVQADataset.py @@ -66,6 +66,13 @@ class OCRVQADataset(Dataset): new_width = int(width * ratio) new_height = int(height * ratio) image = image.resize((new_width, new_height), Image.Resampling.BILINEAR) + + if width < 28 or height < 28: + min_size = min(width, height) + ratio = 28 / min_size + 1 + new_width = int(width * ratio) + new_height = int(height * ratio) + image = image.resize((new_width, new_height), Image.Resampling.BILINEAR) question = sample["question"] answer = sample["answer"]