From e0bab8a6a42a2a463a3712310fddbf1458841d05 Mon Sep 17 00:00:00 2001 From: Lucas Resck <41991486+lucasresck@users.noreply.github.com> Date: Mon, 11 Nov 2024 15:40:20 +0000 Subject: [PATCH] Remove `blobfile` usage from MMLU Inspired by: https://github.com/openai/simple-evals/pull/4 --- mmlu_eval.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/mmlu_eval.py b/mmlu_eval.py index 90b8328..9423c66 100644 --- a/mmlu_eval.py +++ b/mmlu_eval.py @@ -7,7 +7,6 @@ import random import re -import blobfile as bf import pandas from . import common @@ -88,7 +87,7 @@ def __init__(self, num_examples: int | None = None, language: str = "EN-US"): url = f"https://openaipublic.blob.core.windows.net/simple-evals/mmlu_{language}.csv" else: url = "https://openaipublic.blob.core.windows.net/simple-evals/mmlu.csv" - df = pandas.read_csv(bf.BlobFile(url)) + df = pandas.read_csv(url) examples = [row.to_dict() for _, row in df.iterrows()] if num_examples: examples = random.Random(0).sample(examples, num_examples)