Skip to content

Commit

Permalink
Update run entries config for Nova (#3235)
Browse files: browse the repository at this point in the history
  • Loading branch information
yifanmai authored Dec 20, 2024
1 parent 6871ecf commit b01f5f6
Showing 1 changed file with 7 additions and 7 deletions.
Original file line number | Diff line number | Diff line change
Expand Up @@ -9,8 +9,8 @@ entries: [
{description: "narrative_qa:model=text,output_format_instructions=narrative_qa", priority: 1}

# NaturalQuestions
-{description: "natural_qa:model=text,mode=openbook_longans,output_format_instructions=natural_qa_short_answer", priority: 1}
-{description: "natural_qa:model=text,mode=closedbook,output_format_instructions=natural_qa_short_answer", priority: 1}
+{description: "natural_qa:model=text,mode=openbook_longans,output_format_instructions=natural_qa_short_answer_no_prefix", priority: 1}
+{description: "natural_qa:model=text,mode=closedbook,output_format_instructions=natural_qa_short_answer_no_prefix", priority: 1}

# OpenbookQA
{description: "commonsense:model=text_code,dataset=openbookqa,method=multiple_choice_joint,output_format_instructions=openbookqa", priority: 1}
Expand All @@ -35,11 +35,11 @@ entries: [
{description: "gsm:model=text_code,stop=none", priority: 2}

# LegalBench
-{description: "legalbench:model=text_code,subset=abercrombie,output_format_instructions=legalbench_abercrombie_no_prefix,stop=none", priority: 2}
-{description: "legalbench:model=text_code,subset=corporate_lobbying,output_format_instructions=legalbench_yes_or_no_no_prefix,stop=none", priority: 2}
-{description: "legalbench:model=text_code,subset=international_citizenship_questions,output_format_instructions=legalbench_yes_or_no_no_prefix,stop=none", priority: 2}
-{description: "legalbench:model=text_code,subset=function_of_decision_section,output_format_instructions=legalbench_function_of_decision_section_no_prefix,stop=none", priority: 2}
-{description: "legalbench:model=text_code,subset=proa,output_format_instructions=legalbench_yes_or_no_no_prefix,stop=none", priority: 2}
+{description: "legalbench:model=text_code,subset=abercrombie,output_format_instructions=legalbench_no_prefix,stop=none", priority: 2}
+{description: "legalbench:model=text_code,subset=corporate_lobbying,output_format_instructions=legalbench_no_prefix,stop=none", priority: 2}
+{description: "legalbench:model=text_code,subset=international_citizenship_questions,output_format_instructions=legalbench_no_prefix,stop=none", priority: 2}
+{description: "legalbench:model=text_code,subset=function_of_decision_section,output_format_instructions=legalbench_no_prefix,stop=none", priority: 2}
+{description: "legalbench:model=text_code,subset=proa,output_format_instructions=legalbench_no_prefix,stop=none", priority: 2}

# MedQA
{description: "med_qa:model=text_code,output_format_instructions=med_qa", priority: 2}
Expand Down

0 comments on commit b01f5f6

Please sign in to comment.