Voryoji
/

Shuichi

+# coding=utf-8
+# Lint as: python3
+"""bigbench datasets"""
+from __future__ import absolute_import, division, print_function
+import json
+import os
+import textwrap
+import six
+import datasets
+CITATION = r"""
+@article{srivastava2022beyond,
+  title={Beyond the imitation game: Quantifying and extrapolating the capabilities of language models},
+  author={Srivastava, Aarohi and Rastogi, Abhinav and Rao, Abhishek and Shoeb, Abu Awal Md and Abid, Abubakar and Fisch, Adam and Brown, Adam R and Santoro, Adam and Gupta, Aditya and Garriga-Alonso, Adri{\`a} and others},
+  journal={arXiv preprint arXiv:2206.04615},
+  year={2022}
+}
+"""
+DESCRIPTION = """\
+bigbench json tasks
+"""
+DATA_URL = "https://www.dropbox.com/s/cjdywlalikdb1c6/bigbench.zip?dl=1"
+CONFIGS=['abstract_narrative_understanding',
+ 'anachronisms',
+ 'analogical_similarity',
+ 'analytic_entailment',
+ 'arithmetic',
+ 'ascii_word_recognition',
+ 'authorship_verification',
+ 'auto_categorization',
+ 'auto_debugging',
+ 'bbq_lite_json',
+ 'bridging_anaphora_resolution_barqa',
+ 'causal_judgment',
+ 'cause_and_effect',
+ 'checkmate_in_one',
+ 'chess_state_tracking',
+ 'chinese_remainder_theorem',
+ 'cifar10_classification',
+ 'code_line_description',
+ 'codenames',
+ 'color',
+ 'common_morpheme',
+ 'conceptual_combinations',
+ 'conlang_translation',
+ 'contextual_parametric_knowledge_conflicts',
+ 'crash_blossom',
+ 'crass_ai',
+ 'cryobiology_spanish',
+ 'cryptonite',
+ 'cs_algorithms',
+ 'dark_humor_detection',
+ 'date_understanding',
+ 'disambiguation_qa',
+ 'discourse_marker_prediction',
+ 'disfl_qa',
+ 'dyck_languages',
+ 'elementary_math_qa',
+ 'emoji_movie',
+ 'emojis_emotion_prediction',
+ 'empirical_judgments',
+ 'english_proverbs',
+ 'english_russian_proverbs',
+ 'entailed_polarity',
+ 'entailed_polarity_hindi',
+ 'epistemic_reasoning',
+ 'evaluating_information_essentiality',
+ 'fact_checker',
+ 'fantasy_reasoning',
+ 'few_shot_nlg',
+ 'figure_of_speech_detection',
+ 'formal_fallacies_syllogisms_negation',
+ 'gem',
+ 'gender_inclusive_sentences_german',
+ 'general_knowledge',
+ 'geometric_shapes',
+ 'goal_step_wikihow',
+ 'gre_reading_comprehension',
+ 'hhh_alignment',
+ 'hindi_question_answering',
+ 'hindu_knowledge',
+ 'hinglish_toxicity',
+ 'human_organs_senses',
+ 'hyperbaton',
+ 'identify_math_theorems',
+ 'identify_odd_metaphor',
+ 'implicatures',
+ 'implicit_relations',
+ 'indic_cause_and_effect',
+ 'intent_recognition',
+ 'international_phonetic_alphabet_nli',
+ 'international_phonetic_alphabet_transliterate',
+ 'intersect_geometry',
+ 'irony_identification',
+ 'kanji_ascii',
+ 'kannada',
+ 'key_value_maps',
+ 'known_unknowns',
+ 'language_games',
+ 'language_identification',
+ 'linguistic_mappings',
+ 'linguistics_puzzles',
+ 'list_functions',
+ 'logic_grid_puzzle',
+ 'logical_args',
+ 'logical_deduction',
+ 'logical_fallacy_detection',
+ 'logical_sequence',
+ 'mathematical_induction',
+ 'matrixshapes',
+ 'medical_questions_russian',
+ 'metaphor_boolean',
+ 'metaphor_understanding',
+ 'minute_mysteries_qa',
+ 'misconceptions',
+ 'misconceptions_russian',
+ 'mnist_ascii',
+ 'modified_arithmetic',
+ 'moral_permissibility',
+ 'movie_dialog_same_or_different',
+ 'movie_recommendation',
+ 'mult_data_wrangling',
+ 'navigate',
+ 'nonsense_words_grammar',
+ 'novel_concepts',
+ 'object_counting',
+ 'odd_one_out',
+ 'operators',
+ 'paragraph_segmentation',
+ 'parsinlu_qa',
+ 'parsinlu_reading_comprehension',
+ 'penguins_in_a_table',
+ 'periodic_elements',
+ 'persian_idioms',
+ 'phrase_relatedness',
+ 'physical_intuition',
+ 'physics',
+ 'physics_questions',
+ 'play_dialog_same_or_different',
+ 'polish_sequence_labeling',
+ 'presuppositions_as_nli',
+ 'qa_wikidata',
+ 'question_selection',
+ 'real_or_fake_text',
+ 'reasoning_about_colored_objects',
+ 'repeat_copy_logic',
+ 'rephrase',
+ 'rhyming',
+ 'riddle_sense',
+ 'ruin_names',
+ 'salient_translation_error_detection',
+ 'scientific_press_release',
+ 'semantic_parsing_in_context_sparc',
+ 'semantic_parsing_spider',
+ 'sentence_ambiguity',
+ 'similarities_abstraction',
+ 'simp_turing_concept',
+ 'simple_arithmetic_json',
+ 'simple_arithmetic_json_multiple_choice',
+ 'simple_arithmetic_json_subtasks',
+ 'simple_arithmetic_multiple_targets_json',
+ 'simple_ethical_questions',
+ 'simple_text_editing',
+ 'snarks',
+ 'social_iqa',
+ 'social_support',
+ 'sports_understanding',
+ 'strange_stories',
+ 'strategyqa',
+ 'sufficient_information',
+ 'suicide_risk',
+ 'swahili_english_proverbs',
+ 'swedish_to_german_proverbs',
+ 'symbol_interpretation',
+ 'tellmewhy',
+ 'temporal_sequences',
+ 'tense',
+ 'timedial',
+ 'topical_chat',
+ 'tracking_shuffled_objects',
+ 'understanding_fables',
+ 'undo_permutation',
+ 'unit_conversion',
+ 'unit_interpretation',
+ 'unnatural_in_context_learning',
+ 'vitaminc_fact_verification',
+ 'what_is_the_tao',
+ 'which_wiki_edit',
+ 'winowhy',
+ 'word_sorting',
+ 'word_unscrambling']
+class bigbench_Config(datasets.BuilderConfig):
+    """BuilderConfig for bigbench."""
+    def __init__(
+        self,
+        text_features,
+        label_classes=None,
+        process_label=lambda x: x,
+        **kwargs,
+    ):
+        """BuilderConfig for bigbench.
+        Args:
+          text_features: `dict[string, string]`, map from the name of the feature
+            dict for each text field to the name of the column in the tsv file
+          data_url: `string`, url to download the zip file from
+          data_dir: `string`, the path to the folder containing the tsv files in the
+            downloaded zip
+          citation: `string`, citation for the data set
+          url: `string`, url for information about the data set
+        """
+        super(bigbench_Config, self).__init__(
+            version=datasets.Version("1.0.0", ""), **kwargs
+        )
+        self.text_features = text_features
+        self.data_url = DATA_URL
+        self.data_dir = self.name #os.path.join("bigbench", self.name)
+        self.citation = textwrap.dedent(CITATION)
+        self.description = ""
+        self.url = "https://github.com/google/BIG-bench"
+class bigbench(datasets.GeneratorBasedBuilder):
+    """The General Language Understanding Evaluation (bigbench) benchmark."""
+    BUILDER_CONFIG_CLASS = bigbench_Config
+    BUILDER_CONFIGS = [
+        bigbench_Config(
+            name=name,
+            text_features={"inputs": "inputs"},
+        ) for name in CONFIGS
+    ]
+    def _info(self):
+        features = {
+            "inputs": datasets.Value("string"),
+            "targets": datasets.features.Sequence(datasets.Value("string")),
+            "multiple_choice_targets": datasets.features.Sequence(datasets.Value("string")),
+            "multiple_choice_scores": datasets.features.Sequence(datasets.Value("int32")),
+        }
+        features["idx"] = datasets.Value("int32")
+        return datasets.DatasetInfo(
+            description=DESCRIPTION,
+            features=datasets.Features(features),
+            homepage=self.config.url,
+            citation=self.config.citation + "\n" + CITATION,
+        )
+    def _split_generators(self, dl_manager):
+        dl_dir = dl_manager.download_and_extract(self.config.data_url)
+        data_dir = os.path.join(dl_dir, self.config.data_dir)
+        return [
+            datasets.SplitGenerator(
+                name=datasets.Split.TRAIN,
+                gen_kwargs={
+                    "data_file": os.path.join(data_dir or "", "train.jsonl"),
+                    "split": "train",
+                },
+            ),
+            datasets.SplitGenerator(
+                name=datasets.Split.VALIDATION,
+                gen_kwargs={
+                    "data_file": os.path.join(data_dir or "", "validation.jsonl"),
+                    "split": "validation",
+                },
+            ),
+        ]
+    def _generate_examples(self, data_file,split):
+        """Yields examples."""
+        with open(data_file, "r", encoding="utf-8") as f:
+            for id_, line in enumerate(f):
+                line_dict = json.loads(line)
+                yield id_, line_dict

mmlu.py ADDED Viewed

	@@ -0,0 +1,160 @@

+# coding=utf-8
+# Copyright 2020 The HuggingFace Datasets Authors and the current dataset script contributor.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import csv
+import datasets
+_CITATION = """\
+@article{hendryckstest2021,
+      title={Measuring Massive Multitask Language Understanding},
+      author={Dan Hendrycks and Collin Burns and Steven Basart and Andy Zou and Mantas Mazeika and Dawn Song and Jacob Steinhardt},
+      journal={Proceedings of the International Conference on Learning Representations (ICLR)},
+      year={2021}
+    }
+"""
+_DESCRIPTION = """\
+This is a massive multitask test consisting of multiple-choice questions from various branches of knowledge, covering 57 tasks including elementary mathematics, US history, computer science, law, and more.
+"""
+_HOMEPAGE = "https://github.com/hendrycks/test"
+_URL = "https://www.dropbox.com/s/nv4z13trkpq80bj/mmlu.tar?dl=1"
+_SUBJECTS = [
+    "abstract_algebra",
+    "anatomy",
+    "astronomy",
+    "business_ethics",
+    "clinical_knowledge",
+    "college_biology",
+    "college_chemistry",
+    "college_computer_science",
+    "college_mathematics",
+    "college_medicine",
+    "college_physics",
+    "computer_security",
+    "conceptual_physics",
+    "econometrics",
+    "electrical_engineering",
+    "elementary_mathematics",
+    "formal_logic",
+    "global_facts",
+    "high_school_biology",
+    "high_school_chemistry",
+    "high_school_computer_science",
+    "high_school_european_history",
+    "high_school_geography",
+    "high_school_government_and_politics",
+    "high_school_macroeconomics",
+    "high_school_mathematics",
+    "high_school_microeconomics",
+    "high_school_physics",
+    "high_school_psychology",
+    "high_school_statistics",
+    "high_school_us_history",
+    "high_school_world_history",
+    "human_aging",
+    "human_sexuality",
+    "international_law",
+    "jurisprudence",
+    "logical_fallacies",
+    "machine_learning",
+    "management",
+    "marketing",
+    "medical_genetics",
+    "miscellaneous",
+    "moral_disputes",
+    "moral_scenarios",
+    "nutrition",
+    "philosophy",
+    "prehistory",
+    "professional_accounting",
+    "professional_law",
+    "professional_medicine",
+    "professional_psychology",
+    "public_relations",
+    "security_studies",
+    "sociology",
+    "us_foreign_policy",
+    "virology",
+    "world_religions",
+]
+class HendrycksTest(datasets.GeneratorBasedBuilder):
+    """Massive multitask MC test consisting of 57 tasks"""
+    BUILDER_CONFIGS = [
+        datasets.BuilderConfig(
+            name=sub, version=datasets.Version("1.0.0"), description=f"Hendrycks Test Subject {sub}"
+        )
+        for sub in _SUBJECTS
+    ]
+    def _info(self):
+        features = datasets.Features(
+            {
+                "question": datasets.Value("string"),
+                "choices": datasets.features.Sequence(datasets.Value("string")),
+                "answer": datasets.features.ClassLabel(num_classes=4, names=["A", "B", "C", "D"]),
+            }
+        )
+        return datasets.DatasetInfo(
+            description=_DESCRIPTION,
+            features=features,
+            homepage=_HOMEPAGE,
+            citation=_CITATION,
+        )
+    def _split_generators(self, dl_manager):
+        """Returns SplitGenerators."""
+        archive = dl_manager.download(_URL)
+        return [
+            datasets.SplitGenerator(
+                name=datasets.Split.TEST,
+                gen_kwargs={"iter_archive": dl_manager.iter_archive(archive), "split": "test"},
+            ),
+            datasets.SplitGenerator(
+                name=datasets.Split.VALIDATION,
+                gen_kwargs={
+                    "iter_archive": dl_manager.iter_archive(archive),
+                    "split": "val",
+                },
+            ),
+            datasets.SplitGenerator(
+                name=datasets.Split("dev"),
+                gen_kwargs={
+                    "iter_archive": dl_manager.iter_archive(archive),
+                    "split": "dev",
+                },
+            ),
+        ]
+    def _generate_examples(self, iter_archive, split):
+        """Yields examples as (key, example) tuples."""
+        n_yielded_files = 0
+        for id_file, (path, file) in enumerate(iter_archive):
+            if f"data/{split}/" in path:
+                if f"{self.config.name}_{split}.csv" in path:
+                    n_yielded_files += 1
+                    lines = (line.decode("utf-8") for line in file)
+                    reader = csv.reader(lines)
+                    for id_line, data in enumerate(reader):
+                        yield f"{id_file}_{id_line}", {"question": data[0], "choices": data[1:5], "answer": data[5]}
+                    break