-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpost-hoc_runs.txt
24 lines (24 loc) · 3.76 KB
/
post-hoc_runs.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
description='post-hoc' task=qasper model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=natural_questions model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=evidence_inference model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=wice model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=contract_nli model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=govreport model=gpt-4-turbo-128k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=100
description='post-hoc' task=qasper model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=natural_questions model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=evidence_inference model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=wice model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=contract_nli model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=govreport model=gpt-35-turbo-0613 use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=qasper model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=natural_questions model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=evidence_inference model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=wice model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=contract_nli model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='post-hoc' task=govreport model=longchat-7b-v1.5-32k use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000
description='TODO_post-hoc' task=qasper model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO
description='TODO_post-hoc' task=natural_questions model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO
description='TODO_post-hoc' task=evidence_inference model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO
description='TODO_post-hoc' task=wice model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO
description='TODO_post-hoc' task=contract_nli model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO
description='TODO_post-hoc' task=govreport model=flan-t5-xl use_dev_as_test_data=False required_aspects=answer_only use_first_n_test_instances=2000 load_model=True hash_to_load=TODO