Skip to content

Commit

Permalink
update task auto scoring
Browse files Browse the repository at this point in the history
  • Loading branch information
JvThunder committed Mar 18, 2024
1 parent bc4e3b4 commit eeac250
Show file tree
Hide file tree
Showing 2 changed files with 26 additions and 0 deletions.
1 change: 1 addition & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench.yaml
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
# Group definition: collects the OlympiadBench task variants listed below
# under the single group name `olympiadbench`.
group: olympiadbench

# Member tasks; each name is expected to match the `task` key of a sibling
# task config (NOTE(review): confirm both task files exist alongside this one).
task:
  - olympiadbench_test
  - olympiadbench_test_auto_scoring

# Config metadata; kept as a one-item list holding the version mapping.
metadata:
  - version: 0.0
25 changes: 25 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_auto_scoring.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config for the `test_auto_scoring` split of OlympiadBench.
# Nested keys are indented explicitly so that `token` belongs to
# `dataset_kwargs`, the decoding parameters belong to `generation_kwargs`,
# and each metric entry carries its own aggregation settings.
dataset_path: lmms-lab/OlympiadBench
dataset_kwargs:
  # Presumably forwarded to the dataset loader to enable authenticated
  # access — TODO confirm against the loader's keyword arguments.
  token: true
task: "olympiadbench_test_auto_scoring"
test_split: test_auto_scoring
output_type: generate_until

# Hooks resolved via the custom `!function` tag; the referenced callables are
# named in a `utils` module that is not visible from this file.
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"

generation_kwargs:
  # Stop sequence(s) for generation; quoted because the value ends with ':'.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  # Sampling is disabled below, so these settings describe deterministic
  # decoding (NOTE(review): top_p of 0 is unusual — confirm it is ignored
  # when do_sample is false).
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false

process_results: !function utils.olympiadbench_process_results

metric_list:
  # Aggregated by a project-defined function from the utils module.
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  # Aggregated with the built-in `mean` aggregation name.
  - metric: exact_match
    aggregation: mean
    higher_is_better: true

0 comments on commit eeac250

Please sign in to comment.