diff --git a/olmo_data/hf_datasets/vera/arc_easy/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/arc_easy/validation/data-00000-of-00001.arrow deleted file mode 100644 index bc6687e16..000000000 Binary files a/olmo_data/hf_datasets/vera/arc_easy/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/arc_easy/validation/dataset_info.json b/olmo_data/hf_datasets/vera/arc_easy/validation/dataset_info.json deleted file mode 100644 index b8b85ebc9..000000000 --- a/olmo_data/hf_datasets/vera/arc_easy/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 297720, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/arc_easy/dev.json": { - "num_bytes": 363938, - "checksum": "057571f1bdd402425a807713951ad550a80e5de5aafa89089c53b87a8359a34c" - } - }, - "download_size": 363938, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 661658, - "splits": { - "train": { - "name": "train", - "num_bytes": 297720, - "num_examples": 570, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/arc_easy/validation/state.json b/olmo_data/hf_datasets/vera/arc_easy/validation/state.json deleted file mode 100644 index 26f741265..000000000 --- a/olmo_data/hf_datasets/vera/arc_easy/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "ab95dd9080a6fd36", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/arc_hard/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/arc_hard/validation/data-00000-of-00001.arrow deleted file mode 100644 index c1462355b..000000000 Binary files a/olmo_data/hf_datasets/vera/arc_hard/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/arc_hard/validation/dataset_info.json b/olmo_data/hf_datasets/vera/arc_hard/validation/dataset_info.json deleted file mode 100644 index 92200c0e5..000000000 --- a/olmo_data/hf_datasets/vera/arc_hard/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 185159, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/arc_hard/dev.json": { - "num_bytes": 219973, - "checksum": "d6c46711b51b6962d35c87fcd1d7e134036e58aac2b9fa9a5a975227a1d07f88" - } - }, - "download_size": 219973, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 405132, - "splits": { - "train": { - "name": "train", - "num_bytes": 185159, - "num_examples": 299, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/arc_hard/validation/state.json b/olmo_data/hf_datasets/vera/arc_hard/validation/state.json deleted file mode 100644 index c06c679d1..000000000 --- a/olmo_data/hf_datasets/vera/arc_hard/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "3497cef2d55cd31d", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/commonsenseqa/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/commonsenseqa/validation/data-00000-of-00001.arrow deleted file mode 100644 index 29533d7a4..000000000 Binary files a/olmo_data/hf_datasets/vera/commonsenseqa/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/commonsenseqa/validation/dataset_info.json b/olmo_data/hf_datasets/vera/commonsenseqa/validation/dataset_info.json deleted file mode 100644 index 7ec289485..000000000 --- a/olmo_data/hf_datasets/vera/commonsenseqa/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 481139, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/commonsenseqa/dev.json": { - "num_bytes": 637367, - "checksum": "7aa1394cedd454abca93141497eb9a34f31120668e3fb4c41735d900d817b5c9" - } - }, - "download_size": 637367, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 1118506, - "splits": { - "train": { - "name": "train", - "num_bytes": 481139, - "num_examples": 1221, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/commonsenseqa/validation/state.json b/olmo_data/hf_datasets/vera/commonsenseqa/validation/state.json deleted file mode 100644 index fc3fe753b..000000000 --- a/olmo_data/hf_datasets/vera/commonsenseqa/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "48550800ec535043", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/physical_iqa/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/physical_iqa/validation/data-00000-of-00001.arrow deleted file mode 100644 index 4bb011f31..000000000 Binary files a/olmo_data/hf_datasets/vera/physical_iqa/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/physical_iqa/validation/dataset_info.json b/olmo_data/hf_datasets/vera/physical_iqa/validation/dataset_info.json deleted file mode 100644 index 8a81b788a..000000000 --- a/olmo_data/hf_datasets/vera/physical_iqa/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 500987, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/physical_iqa/dev.json": { - "num_bytes": 670435, - "checksum": "17906535bd6c130072acb3f47e6d52e74f0ed4c19d03b0a74da1f20688492bd9" - } - }, - "download_size": 670435, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 1171422, - "splits": { - "train": { - "name": "train", - "num_bytes": 500987, - "num_examples": 1838, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/physical_iqa/validation/state.json b/olmo_data/hf_datasets/vera/physical_iqa/validation/state.json deleted file mode 100644 index bad03a42f..000000000 --- a/olmo_data/hf_datasets/vera/physical_iqa/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "9e546ba9430acfd2", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/sciq/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/sciq/validation/data-00000-of-00001.arrow deleted file mode 100644 index 6ee0060c6..000000000 Binary files a/olmo_data/hf_datasets/vera/sciq/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/sciq/validation/dataset_info.json b/olmo_data/hf_datasets/vera/sciq/validation/dataset_info.json deleted file mode 100644 index bbe4f16f8..000000000 --- a/olmo_data/hf_datasets/vera/sciq/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 349959, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/sciq/dev.json": { - "num_bytes": 466237, - "checksum": "f779d17f4509a7514afba665f38d78ceaddbae978f0571857bdd6683f1055755" - } - }, - "download_size": 466237, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 816196, - "splits": { - "train": { - "name": "train", - "num_bytes": 349959, - "num_examples": 1000, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/sciq/validation/state.json b/olmo_data/hf_datasets/vera/sciq/validation/state.json deleted file mode 100644 index 05911451d..000000000 --- a/olmo_data/hf_datasets/vera/sciq/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "c3ae3fb5751af3a9", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/social_iqa/validation/data-00000-of-00001.arrow b/olmo_data/hf_datasets/vera/social_iqa/validation/data-00000-of-00001.arrow deleted file mode 100644 index 208083882..000000000 Binary files a/olmo_data/hf_datasets/vera/social_iqa/validation/data-00000-of-00001.arrow and /dev/null differ diff --git a/olmo_data/hf_datasets/vera/social_iqa/validation/dataset_info.json b/olmo_data/hf_datasets/vera/social_iqa/validation/dataset_info.json deleted file mode 100644 index 90f2022ed..000000000 --- a/olmo_data/hf_datasets/vera/social_iqa/validation/dataset_info.json +++ /dev/null @@ -1,47 +0,0 @@ -{ - "builder_name": "json", - "citation": "", - "config_name": "default", - "dataset_size": 740508, - "description": "", - "download_checksums": { - "/mmfs1/gscratch/xlab/liujc/c-data/declarative/t5_v2/social_iqa/dev.json": { - "num_bytes": 943756, - "checksum": "39bd4e3a695b46f3c9660a7051beee7fbb87a4908608be0c2b6d2c2ac2998259" - } - }, - "download_size": 943756, - "features": { - "golds": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - }, - "distractors": { - "feature": { - "dtype": "string", - "_type": "Value" - }, - "_type": "Sequence" - } - }, - "homepage": "", - "license": "", - "size_in_bytes": 1684264, - "splits": { - "train": { - "name": "train", - "num_bytes": 740508, - "num_examples": 1954, - "dataset_name": "json" - } - }, - "version": { - "version_str": "0.0.0", - "major": 0, - "minor": 0, - "patch": 0 - } -} \ No newline at end of file diff --git a/olmo_data/hf_datasets/vera/social_iqa/validation/state.json b/olmo_data/hf_datasets/vera/social_iqa/validation/state.json deleted file mode 100644 index 0dd3ed3f3..000000000 --- a/olmo_data/hf_datasets/vera/social_iqa/validation/state.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "_data_files": [ - { - "filename": "data-00000-of-00001.arrow" - } - ], - "_fingerprint": "4fcee0ae859d13b4", - "_format_columns": null, - "_format_kwargs": {}, - "_format_type": null, - "_output_all_columns": false, - "_split": "train" -} \ No newline at end of file