FasterDFlash
/

Hanrui

Model card Files Files and versions

Hanrui / progress /github /SpecForge /benchmarks /benchmarker /financeqa.py

Lekr0's picture

Add files using upload-large-folder tool

212a146 verified 19 days ago

history blame contribute delete

1.62 kB

	from typing import Any, Dict, List, Optional, Tuple

	from datasets import load_dataset

	from .base import Benchmarker
	from .registry import BENCHMARKS
	from .utils import create_simple_sgl_function

	# Prompt template for rows that carry a context passage: generate_question
	# fills the {context} and {question} placeholders via str.format. The
	# leading/trailing whitespace of the literal is removed by .strip().
	QUESTION_PROMPT = """
	Given the following context:

	{context}

	Can you answer the following question?

	{question}
	""".strip()


	def generate_question(row: Dict[str, Any]) -> str:
	    """Build the prompt text for a single dataset row.

	    Args:
	        row: Mapping with a ``"question"`` string and an optional
	            ``"context"`` string.

	    Returns:
	        The stripped question alone when the row has no usable context
	        (key missing, ``None``, or only whitespace); otherwise
	        ``QUESTION_PROMPT`` filled with the stripped context and question.
	    """
	    question = row["question"].strip()
	    context = (row.get("context") or "").strip()
	    # A blank context would leave an empty "Given the following context:"
	    # section in the prompt, so fall back to the bare question instead.
	    if not context:
	        return question
	    return QUESTION_PROMPT.format(context=context, question=question)


	@BENCHMARKS.register("financeqa")
	class FinanceQABenchmarker(Benchmarker):
	    """Benchmarker for the FinanceQA dataset, registered as ``"financeqa"``."""

	    def __init__(self, num_samples: Optional[int] = None):
	        # The second positional argument is passed as None; its meaning is
	        # defined by Benchmarker.__init__, which is not visible in this file.
	        super().__init__(num_samples, None)

	    def load_data(self) -> Tuple[List[Dict[str, Any]], List[int]]:
	        """Build prompts from the ``test`` split of ``AfterQuery/FinanceQA``.

	        Returns:
	            A ``(questions, labels)`` pair. Each question is a dict with a
	            single ``"question"`` key holding the prompt text; every label
	            is ``None``.
	        """
	        test_split = load_dataset("AfterQuery/FinanceQA")["test"]

	        # Cap the number of rows at num_samples when one was given.
	        total = len(test_split)
	        if self.num_samples is not None:
	            total = min(total, self.num_samples)

	        prompts = [
	            {"question": generate_question(test_split[idx])}
	            for idx in range(total)
	        ]
	        placeholders = [None] * len(prompts)
	        return prompts, placeholders

	    def create_sgl_function(self):
	        """Build the SGL function through ``create_simple_sgl_function``."""
	        token_budget = self.get_max_new_tokens()
	        return create_simple_sgl_function(
	            function_name="get_financeqa_answer",
	            answer_key="answer",
	            max_tokens=token_budget,
	        )