Skip to content

Commit e0926c9

Browse files
author
Yue Deng
committed
fix hle text only
1 parent b9527ec commit e0926c9

File tree

2 files changed

+14
-12
lines changed

2 files changed

+14
-12
lines changed

docs/mkdocs/docs/hle_text_only.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ More details: [HLE text only Dataset on HuggingFace](https://huggingface.co/data
99
## Dataset Overview
1010

1111
!!! info "HLE Dataset (text only)"
12-
The dataset is a text-only subset of HLE.
12+
The experiments are conducted on the **500-sample text-only subset** of the HLE dataset, available from [WebThinker](https://github.com/RUC-NLPIR/WebThinker/blob/main/data/HLE/test.json).
1313

1414
---
1515

utils/prepare_benchmark/gen_hle_text_only.py

Lines changed: 13 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -2,29 +2,31 @@
22
#
33
# SPDX-License-Identifier: Apache-2.0
44

5+
6+
import json
57
from typing import Generator, MutableMapping
68

7-
from datasets import load_dataset
9+
import requests
810

911
from utils.prepare_benchmark.common import Task
1012

1113

1214
def gen_hle_text_only(hf_token: str) -> Generator[Task, None, None]:
13-
dataset = load_dataset("macabdul9/hle_text_only", split="test", token=hf_token)
14-
for x in dataset:
15-
metadata: MutableMapping = x # type: ignore
16-
task_id = metadata.pop("id")
17-
question = metadata.pop("question")
18-
gt = metadata.pop("answer")
19-
metadata.pop("image_preview")
20-
metadata.pop("rationale_image")
15+
response = requests.get(
16+
"https://raw.githubusercontent.com/RUC-NLPIR/WebThinker/refs/heads/main/data/HLE/test.json"
17+
)
18+
dataset = json.loads(response.content)
19+
for row in dataset:
20+
metadata: MutableMapping = row
21+
task_id = str(metadata.pop("id", ""))
22+
question = metadata.pop("Question", "")
23+
answer = metadata.pop("answer", "")
2124
task = Task(
2225
task_id=task_id,
2326
task_question=question,
24-
ground_truth=gt,
27+
ground_truth=answer,
2528
file_path=None,
2629
metadata=metadata,
2730
)
2831
yield task
29-
3032
return

0 commit comments

Comments
 (0)