Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion src/lighteval/metrics/metrics_sample.py
Original file line number Diff line number Diff line change
Expand Up @@ -926,7 +926,7 @@ def compute(self, sample_ids: list[str], responses: list, formatted_docs: list[D
"""
questions = [formatted_doc.specific["question"] for formatted_doc in formatted_docs]
options = [formatted_doc.choices for formatted_doc in formatted_docs]
- golds = [formatted_doc.choices[formatted_doc.gold_index[0]] for formatted_doc in formatted_docs]
+ golds = [formatted_doc.get_golds() for formatted_doc in formatted_docs]
predictions = [response[0].result[0] for response in responses]

scores, messages, judgements = self.judge.evaluate_answer_batch(questions, predictions, options, golds)
Expand Down
Loading