diff --git a/pythia/common/defaults/configs/tasks/vqa/textvqa.yml b/pythia/common/defaults/configs/tasks/vqa/textvqa.yml index 4c7a0176d..fd02983a6 100644 --- a/pythia/common/defaults/configs/tasks/vqa/textvqa.yml +++ b/pythia/common/defaults/configs/tasks/vqa/textvqa.yml @@ -58,7 +58,7 @@ task_attributes: return_info: true # Return OCR information use_ocr: true - # Return spatial information of OCR tokens if present + # Return spatial information of OCR tokens if present (main) use_ocr_info: false training_parameters: monitored_metric: textvqa_vqa_accuracy diff --git a/pythia/tasks/__init__.py b/pythia/tasks/__init__.py index 0e706c849..a7ad48671 100644 --- a/pythia/tasks/__init__.py +++ b/pythia/tasks/__init__.py @@ -5,3 +5,5 @@ from .base_dataset import BaseDataset __all__ = ["BaseTask", "BaseDatasetBuilder", "BaseDataset", "MultiTask"] + +print(" ## Test1 : Checking whether this tasks is getting initialized or not ## ") \ No newline at end of file diff --git a/pythia/tasks/vqa/__init__.py b/pythia/tasks/vqa/__init__.py index a0ae689c9..3bb0dc6b5 100644 --- a/pythia/tasks/vqa/__init__.py +++ b/pythia/tasks/vqa/__init__.py @@ -2,3 +2,5 @@ __all__ = ["VQATask"] from .vqa_task import VQATask + +print(" ## Test2 : Checking whether this vqa_task is getting initialized or not ## ") \ No newline at end of file diff --git a/pythia/tasks/vqa/textvqa/__init__.py b/pythia/tasks/vqa/textvqa/__init__.py index 9020c2df2..adb2bfa51 100644 --- a/pythia/tasks/vqa/textvqa/__init__.py +++ b/pythia/tasks/vqa/textvqa/__init__.py @@ -1 +1,3 @@ # Copyright (c) Facebook, Inc. and its affiliates. + +print(" ## Test3 : Checking whether this textvqa task is getting initialized or not ## ") diff --git a/pythia/tasks/vqa/vqa2/__init__.py b/pythia/tasks/vqa/vqa2/__init__.py index 160ad206c..dde9a66ac 100644 --- a/pythia/tasks/vqa/vqa2/__init__.py +++ b/pythia/tasks/vqa/vqa2/__init__.py @@ -3,3 +3,5 @@ from .builder import VQA2Builder from .dataset import VQA2Dataset + +print(" ## Test4 : Checking whether this vqa2 is getting initialized or not ## ") \ No newline at end of file diff --git a/pythia/tasks/vqa/vqa2/dataset.py b/pythia/tasks/vqa/vqa2/dataset.py index dbe35abdb..fa1da78be 100644 --- a/pythia/tasks/vqa/vqa2/dataset.py +++ b/pythia/tasks/vqa/vqa2/dataset.py @@ -140,6 +140,8 @@ def add_ocr_details(self, sample_info, sample): self.ocr_token_processor({"text": token})["text"] for token in sample_info["ocr_tokens"] ] + print(" ## Test5 : checking for OCR tokens # ") + print(ocr_tokens) # Get embeddings for tokens context = self.context_processor({"tokens": ocr_tokens}) sample.context = context["text"] diff --git a/pythia/tasks/vqa/vqa2/ocr_builder.py b/pythia/tasks/vqa/vqa2/ocr_builder.py index ebc01a155..bd388aadb 100644 --- a/pythia/tasks/vqa/vqa2/ocr_builder.py +++ b/pythia/tasks/vqa/vqa2/ocr_builder.py @@ -6,6 +6,8 @@ @Registry.register_builder("vqa2_ocr") class TextVQABuilder(VizWizBuilder): + print(" ## Test6 : VQA2OCRDataset # ") + #print(ocr_tokens) def __init__(self): super().__init__() self.dataset_name = "VQA2_OCR"