generated from allenai/python-package-template
-
Notifications
You must be signed in to change notification settings - Fork 39
/
Copy patheval_suite_ppl_val_v3.libsonnet
54 lines (48 loc) · 1.22 KB
/
eval_suite_ppl_val_v3.libsonnet
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
local task_utils = import 'task_utils.libsonnet';
// Keyword arguments handed to the task-set builder together with the
// per-task dicts (see the final object of this file).
local common_kwargs = {
  task_name: 'ppl_custom',
  prediction_kwargs: {
    // The maximum model length is defined once in task_utils.libsonnet.
    model_max_length: task_utils.model_max_length,
    split: 'validation',
  },
  task_kwargs: {
    detailed_output: true,
    keep_all_instance_fields_except: ['text', 'tokens'],
  },
};
// TODO: Refactor catwalk's Perplexity task so that it actually uses the S3 path.
// Until then, the path must be present on NFS ($EVAL_DATA_PATH).
// Directory containing the per-task validation files.
// Deliberately has no trailing slash: the separator is inserted when the
// per-task path is assembled in create_task_kwargs.
local data_dir = "olmo-ppl-val-v3";

// Builds one task dict per entry of `task_names`.
//
// Each resulting dict has a single `task_kwargs` object with:
//   task_rename: the task name prefixed with "ppl_"
//   files:       a one-element list, "<data_dir>/<task_name>/val"
//
// An empty `task_names` list yields an empty list.
local create_task_kwargs(task_names) = [
  {
    task_kwargs: {
      task_rename: "ppl_" + task_name,
      // std.join puts exactly one "/" between segments. Plain concatenation
      // with a slash-terminated data_dir used to produce
      // "olmo-ppl-val-v3//<task_name>/val".
      files: [std.join("/", [data_dir, task_name, "val"])],
    },
  }
  for task_name in task_names
];
// Names of the validation sources in this suite. Each name is turned into
// one task dict by create_task_kwargs; list order is preserved.
local ppl_val_sources = [
  'm2d2_s2orc_unsplit',
  'm2d2_wikipedia_unsplit',
  'c4_100_domains',
  'pile',
  'ice_fixed',
  'c4_en',
  'mc4',
  '4chan_meta_sep',
  'manosphere_meta_sep',
  'gab',
  'twitterAAE_HELM_fixed',
  'wikitext_103',
  'ptb',
  'redpajama',
  'falcon-refinedweb',
  'dolma-v1_5',
  'dolma_100_subreddits',
];
local task_dicts = create_task_kwargs(ppl_val_sources);
// The file evaluates to an object with a single field, `task_set`, built by
// task_utils from the per-task dicts and the common keyword arguments.
local eval_suite = task_utils.create_task_set_from_task_dicts(
  'eval_suite', task_dicts, common_kwargs
);
{
  task_set: eval_suite,
}