|
44 | 44 | from .GUI.vbgd import VBGD |
45 | 45 | from .GUI.venusbench import VenusBench_GD |
46 | 46 | from .hipho import HiPhODataset |
| 47 | +from .hle import HLEDataset |
47 | 48 | from .image_base import ImageBaseDataset, img_root_map |
48 | 49 | from .image_caption import ImageCaptionDataset |
49 | 50 | from .image_ccocr import CCOCRDataset |
@@ -275,7 +276,7 @@ def evaluate(self, eval_file, **judge_kwargs): |
275 | 276 | HRBenchDataset, CRPE, MathVerse, NaturalBenchDataset, MIABench, |
276 | 277 | OlympiadBench, SeePhys, WildVision, MMMath, QSpatial, Dynamath, GSM8KVDataset, MMGenBench, VizWiz, # noqa: E501 |
277 | 278 | MMNIAH, CMMMU, VLRewardBench, WeMath, LogicVista, MMMUProDataset, |
278 | | - CreationMMBenchDataset, ImageShortQADataset, MMAlignBench, OmniDocBench, |
| 279 | + CreationMMBenchDataset, HLEDataset, ImageShortQADataset, MMAlignBench, OmniDocBench, |
279 | 280 | VLM2Bench, VMCBenchDataset, EMMADataset, MME_CoT, MOAT, MedXpertQA_MM_test, |
280 | 281 | LEGO, MMSci_Captioning, Physics_yale, ScreenSpot_Pro, ScreenSpot, VenusBench_GD, |
281 | 282 | ScreenSpotV2, OSWorld_G, VBGD, MMIFEval, Spatial457, VisuLogic, CVBench, PathVQA_VAL, |
|
0 commit comments