[
  {
    "path": ".github/scripts/release.py",
    "content": "#!/usr/bin/env python3\nimport json\nimport subprocess\n\n\ndef get_last_version() -> str:\n    \"\"\"Return the version number of the last release.\"\"\"\n    json_string = (\n        subprocess.run(\n            [\"gh\", \"release\", \"view\", \"--json\", \"tagName\"],\n            check=True,\n            stdout=subprocess.PIPE,\n            stderr=subprocess.PIPE,\n        )\n        .stdout.decode(\"utf8\")\n        .strip()\n    )\n\n    return json.loads(json_string)[\"tagName\"]\n\n\ndef bump_patch_number(version_number: str) -> str:\n    \"\"\"Return a copy of `version_number` with the patch number incremented.\"\"\"\n    major, minor, patch = version_number.split(\".\")\n    return f\"{major}.{minor}.{int(patch) + 1}\"\n\n\ndef create_new_patch_release():\n    \"\"\"Create a new patch release on GitHub.\"\"\"\n    try:\n        last_version_number = get_last_version()\n    except subprocess.CalledProcessError as err:\n        if err.stderr.decode(\"utf8\").startswith(\"HTTP 404:\"):\n            # The project doesn't have any releases yet.\n            new_version_number = \"0.0.1\"\n        else:\n            raise\n    else:\n        new_version_number = bump_patch_number(last_version_number)\n\n    subprocess.run(\n        [\"gh\", \"release\", \"create\", \"--generate-notes\", new_version_number],\n        check=True,\n    )\n\n\nif __name__ == \"__main__\":\n    create_new_patch_release()\n"
  },
  {
    "path": ".github/workflows/python-publish.yml",
    "content": "name: Publish to PyPI.org\non:\n  release:\n    types: [published]\njobs:\n  pypi:\n    runs-on: ubuntu-latest\n    steps:\n      - name: Checkout\n        uses: actions/checkout@v3\n        with:\n          fetch-depth: 0\n      - run: python3 -m pip install --upgrade build && python3 -m build\n      - name: Publish package\n        uses: pypa/gh-action-pypi-publish@release/v1\n        with:\n          password: ${{ secrets.PYPI_API_TOKEN }}\n"
  },
  {
    "path": ".github/workflows/release.yml",
    "content": "name: Create a new patch release\non: workflow_dispatch\njobs:\n  github:\n    runs-on: ubuntu-latest\n    steps:\n      - name: Checkout\n        uses: actions/checkout@v3\n      - name: Create new patch release\n        run: .github/scripts/release.py\n        env:\n          GITHUB_TOKEN: ${{ secrets.PERSONAL_ACCESS_TOKEN }}\n"
  },
  {
    "path": ".gitignore",
    "content": "# Byte-compiled / optimized / DLL files\n__pycache__/\n*.py[cod]\n\n# C extensions\n*.so\n\n# Distribution / packaging\n.Python\nenv/\nbuild/\ndevelop-eggs/\ndist/\ndownloads/\neggs/\n.eggs/\nlib/\nlib64/\nparts/\nsdist/\nvar/\n*.egg-info/\n.installed.cfg\n*.egg\n\n# PyInstaller\n#  Usually these files are written by a python script from a template\n#  before PyInstaller builds the exe, so as to inject date/other infos into it.\n*.manifest\n*.spec\n\n# Installer logs\npip-log.txt\npip-delete-this-directory.txt\n\n# Unit test / coverage reports\nhtmlcov/\n.tox/\n.coverage\n.coverage.*\n.cache\nnosetests.xml\ncoverage.xml\n*,cover\n\n# Translations\n*.mo\n*.pot\n\n# Django stuff:\n*.log\n\n# Sphinx documentation\ndocs/_build/\n\n# PyBuilder\ntarget/\n"
  },
  {
    "path": "CITATION.cff",
    "content": "cff-version: 1.1.0\nmessage: \"If you use this work, please cite it as below.\"\nauthors:\n  - family-names: \"Sileo\"\n    given-names: \"Damien\"\ntitle: \"tasksource: A Dataset Harmonization Framework for Streamlined NLP Multi-Task Learning and Evaluation\"\nversion: \"1.0.0\"\ndate-released: 2023-01-01\nurl: \"https://arxiv.org/abs/2301.05948\"\n"
  },
  {
    "path": "LICENSE",
    "content": "Attribution 4.0 International\n\n=======================================================================\n\nCreative Commons Corporation (\"Creative Commons\") is not a law firm and\ndoes not provide legal services or legal advice. Distribution of\nCreative Commons public licenses does not create a lawyer-client or\nother relationship. Creative Commons makes its licenses and related\ninformation available on an \"as-is\" basis. Creative Commons gives no\nwarranties regarding its licenses, any material licensed under their\nterms and conditions, or any related information. Creative Commons\ndisclaims all liability for damages resulting from their use to the\nfullest extent possible.\n\nUsing Creative Commons Public Licenses\n\nCreative Commons public licenses provide a standard set of terms and\nconditions that creators and other rights holders may use to share\noriginal works of authorship and other material subject to copyright\nand certain other rights specified in the public license below. The\nfollowing considerations are for informational purposes only, are not\nexhaustive, and do not form part of our licenses.\n\n     Considerations for licensors: Our public licenses are\n     intended for use by those authorized to give the public\n     permission to use material in ways otherwise restricted by\n     copyright and certain other rights. Our licenses are\n     irrevocable. Licensors should read and understand the terms\n     and conditions of the license they choose before applying it.\n     Licensors should also secure all rights necessary before\n     applying our licenses so that the public can reuse the\n     material as expected. Licensors should clearly mark any\n     material not subject to the license. This includes other CC-\n     licensed material, or material used under an exception or\n     limitation to copyright. More considerations for licensors:\n\twiki.creativecommons.org/Considerations_for_licensors\n\n     Considerations for the public: By using one of our public\n     licenses, a licensor grants the public permission to use the\n     licensed material under specified terms and conditions. If\n     the licensor's permission is not necessary for any reason--for\n     example, because of any applicable exception or limitation to\n     copyright--then that use is not regulated by the license. Our\n     licenses grant only permissions under copyright and certain\n     other rights that a licensor has authority to grant. Use of\n     the licensed material may still be restricted for other\n     reasons, including because others have copyright or other\n     rights in the material. A licensor may make special requests,\n     such as asking that all changes be marked or described.\n     Although not required by our licenses, you are encouraged to\n     respect those requests where reasonable. More_considerations\n     for the public:\n\twiki.creativecommons.org/Considerations_for_licensees\n\n=======================================================================\n\nCreative Commons Attribution 4.0 International Public License\n\nBy exercising the Licensed Rights (defined below), You accept and agree\nto be bound by the terms and conditions of this Creative Commons\nAttribution 4.0 International Public License (\"Public License\"). To the\nextent this Public License may be interpreted as a contract, You are\ngranted the Licensed Rights in consideration of Your acceptance of\nthese terms and conditions, and the Licensor grants You such rights in\nconsideration of benefits the Licensor receives from making the\nLicensed Material available under these terms and conditions.\n\n\nSection 1 -- Definitions.\n\n  a. Adapted Material means material subject to Copyright and Similar\n     Rights that is derived from or based upon the Licensed Material\n     and in which the Licensed Material is translated, altered,\n     arranged, transformed, or otherwise modified in a manner requiring\n     permission under the Copyright and Similar Rights held by the\n     Licensor. For purposes of this Public License, where the Licensed\n     Material is a musical work, performance, or sound recording,\n     Adapted Material is always produced where the Licensed Material is\n     synched in timed relation with a moving image.\n\n  b. Adapter's License means the license You apply to Your Copyright\n     and Similar Rights in Your contributions to Adapted Material in\n     accordance with the terms and conditions of this Public License.\n\n  c. Copyright and Similar Rights means copyright and/or similar rights\n     closely related to copyright including, without limitation,\n     performance, broadcast, sound recording, and Sui Generis Database\n     Rights, without regard to how the rights are labeled or\n     categorized. For purposes of this Public License, the rights\n     specified in Section 2(b)(1)-(2) are not Copyright and Similar\n     Rights.\n\n  d. Effective Technological Measures means those measures that, in the\n     absence of proper authority, may not be circumvented under laws\n     fulfilling obligations under Article 11 of the WIPO Copyright\n     Treaty adopted on December 20, 1996, and/or similar international\n     agreements.\n\n  e. Exceptions and Limitations means fair use, fair dealing, and/or\n     any other exception or limitation to Copyright and Similar Rights\n     that applies to Your use of the Licensed Material.\n\n  f. Licensed Material means the artistic or literary work, database,\n     or other material to which the Licensor applied this Public\n     License.\n\n  g. Licensed Rights means the rights granted to You subject to the\n     terms and conditions of this Public License, which are limited to\n     all Copyright and Similar Rights that apply to Your use of the\n     Licensed Material and that the Licensor has authority to license.\n\n  h. Licensor means the individual(s) or entity(ies) granting rights\n     under this Public License.\n\n  i. Share means to provide material to the public by any means or\n     process that requires permission under the Licensed Rights, such\n     as reproduction, public display, public performance, distribution,\n     dissemination, communication, or importation, and to make material\n     available to the public including in ways that members of the\n     public may access the material from a place and at a time\n     individually chosen by them.\n\n  j. Sui Generis Database Rights means rights other than copyright\n     resulting from Directive 96/9/EC of the European Parliament and of\n     the Council of 11 March 1996 on the legal protection of databases,\n     as amended and/or succeeded, as well as other essentially\n     equivalent rights anywhere in the world.\n\n  k. You means the individual or entity exercising the Licensed Rights\n     under this Public License. Your has a corresponding meaning.\n\n\nSection 2 -- Scope.\n\n  a. License grant.\n\n       1. Subject to the terms and conditions of this Public License,\n          the Licensor hereby grants You a worldwide, royalty-free,\n          non-sublicensable, non-exclusive, irrevocable license to\n          exercise the Licensed Rights in the Licensed Material to:\n\n            a. reproduce and Share the Licensed Material, in whole or\n               in part; and\n\n            b. produce, reproduce, and Share Adapted Material.\n\n       2. Exceptions and Limitations. For the avoidance of doubt, where\n          Exceptions and Limitations apply to Your use, this Public\n          License does not apply, and You do not need to comply with\n          its terms and conditions.\n\n       3. Term. The term of this Public License is specified in Section\n          6(a).\n\n       4. Media and formats; technical modifications allowed. The\n          Licensor authorizes You to exercise the Licensed Rights in\n          all media and formats whether now known or hereafter created,\n          and to make technical modifications necessary to do so. The\n          Licensor waives and/or agrees not to assert any right or\n          authority to forbid You from making technical modifications\n          necessary to exercise the Licensed Rights, including\n          technical modifications necessary to circumvent Effective\n          Technological Measures. For purposes of this Public License,\n          simply making modifications authorized by this Section 2(a)\n          (4) never produces Adapted Material.\n\n       5. Downstream recipients.\n\n            a. Offer from the Licensor -- Licensed Material. Every\n               recipient of the Licensed Material automatically\n               receives an offer from the Licensor to exercise the\n               Licensed Rights under the terms and conditions of this\n               Public License.\n\n            b. No downstream restrictions. You may not offer or impose\n               any additional or different terms or conditions on, or\n               apply any Effective Technological Measures to, the\n               Licensed Material if doing so restricts exercise of the\n               Licensed Rights by any recipient of the Licensed\n               Material.\n\n       6. No endorsement. Nothing in this Public License constitutes or\n          may be construed as permission to assert or imply that You\n          are, or that Your use of the Licensed Material is, connected\n          with, or sponsored, endorsed, or granted official status by,\n          the Licensor or others designated to receive attribution as\n          provided in Section 3(a)(1)(A)(i).\n\n  b. Other rights.\n\n       1. Moral rights, such as the right of integrity, are not\n          licensed under this Public License, nor are publicity,\n          privacy, and/or other similar personality rights; however, to\n          the extent possible, the Licensor waives and/or agrees not to\n          assert any such rights held by the Licensor to the limited\n          extent necessary to allow You to exercise the Licensed\n          Rights, but not otherwise.\n\n       2. Patent and trademark rights are not licensed under this\n          Public License.\n\n       3. To the extent possible, the Licensor waives any right to\n          collect royalties from You for the exercise of the Licensed\n          Rights, whether directly or through a collecting society\n          under any voluntary or waivable statutory or compulsory\n          licensing scheme. In all other cases the Licensor expressly\n          reserves any right to collect such royalties.\n\n\nSection 3 -- License Conditions.\n\nYour exercise of the Licensed Rights is expressly made subject to the\nfollowing conditions.\n\n  a. Attribution.\n\n       1. If You Share the Licensed Material (including in modified\n          form), You must:\n\n            a. retain the following if it is supplied by the Licensor\n               with the Licensed Material:\n\n                 i. identification of the creator(s) of the Licensed\n                    Material and any others designated to receive\n                    attribution, in any reasonable manner requested by\n                    the Licensor (including by pseudonym if\n                    designated);\n\n                ii. a copyright notice;\n\n               iii. a notice that refers to this Public License;\n\n                iv. a notice that refers to the disclaimer of\n                    warranties;\n\n                 v. a URI or hyperlink to the Licensed Material to the\n                    extent reasonably practicable;\n\n            b. indicate if You modified the Licensed Material and\n               retain an indication of any previous modifications; and\n\n            c. indicate the Licensed Material is licensed under this\n               Public License, and include the text of, or the URI or\n               hyperlink to, this Public License.\n\n       2. You may satisfy the conditions in Section 3(a)(1) in any\n          reasonable manner based on the medium, means, and context in\n          which You Share the Licensed Material. For example, it may be\n          reasonable to satisfy the conditions by providing a URI or\n          hyperlink to a resource that includes the required\n          information.\n\n       3. If requested by the Licensor, You must remove any of the\n          information required by Section 3(a)(1)(A) to the extent\n          reasonably practicable.\n\n       4. If You Share Adapted Material You produce, the Adapter's\n          License You apply must not prevent recipients of the Adapted\n          Material from complying with this Public License.\n\n\nSection 4 -- Sui Generis Database Rights.\n\nWhere the Licensed Rights include Sui Generis Database Rights that\napply to Your use of the Licensed Material:\n\n  a. for the avoidance of doubt, Section 2(a)(1) grants You the right\n     to extract, reuse, reproduce, and Share all or a substantial\n     portion of the contents of the database;\n\n  b. if You include all or a substantial portion of the database\n     contents in a database in which You have Sui Generis Database\n     Rights, then the database in which You have Sui Generis Database\n     Rights (but not its individual contents) is Adapted Material; and\n\n  c. You must comply with the conditions in Section 3(a) if You Share\n     all or a substantial portion of the contents of the database.\n\nFor the avoidance of doubt, this Section 4 supplements and does not\nreplace Your obligations under this Public License where the Licensed\nRights include other Copyright and Similar Rights.\n\n\nSection 5 -- Disclaimer of Warranties and Limitation of Liability.\n\n  a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE\n     EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS\n     AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF\n     ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,\n     IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,\n     WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR\n     PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,\n     ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT\n     KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT\n     ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.\n\n  b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE\n     TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,\n     NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,\n     INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,\n     COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR\n     USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN\n     ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR\n     DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR\n     IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.\n\n  c. The disclaimer of warranties and limitation of liability provided\n     above shall be interpreted in a manner that, to the extent\n     possible, most closely approximates an absolute disclaimer and\n     waiver of all liability.\n\n\nSection 6 -- Term and Termination.\n\n  a. This Public License applies for the term of the Copyright and\n     Similar Rights licensed here. However, if You fail to comply with\n     this Public License, then Your rights under this Public License\n     terminate automatically.\n\n  b. Where Your right to use the Licensed Material has terminated under\n     Section 6(a), it reinstates:\n\n       1. automatically as of the date the violation is cured, provided\n          it is cured within 30 days of Your discovery of the\n          violation; or\n\n       2. upon express reinstatement by the Licensor.\n\n     For the avoidance of doubt, this Section 6(b) does not affect any\n     right the Licensor may have to seek remedies for Your violations\n     of this Public License.\n\n  c. For the avoidance of doubt, the Licensor may also offer the\n     Licensed Material under separate terms or conditions or stop\n     distributing the Licensed Material at any time; however, doing so\n     will not terminate this Public License.\n\n  d. Sections 1, 5, 6, 7, and 8 survive termination of this Public\n     License.\n\n\nSection 7 -- Other Terms and Conditions.\n\n  a. The Licensor shall not be bound by any additional or different\n     terms or conditions communicated by You unless expressly agreed.\n\n  b. Any arrangements, understandings, or agreements regarding the\n     Licensed Material not stated herein are separate from and\n     independent of the terms and conditions of this Public License.\n\n\nSection 8 -- Interpretation.\n\n  a. For the avoidance of doubt, this Public License does not, and\n     shall not be interpreted to, reduce, limit, restrict, or impose\n     conditions on any use of the Licensed Material that could lawfully\n     be made without permission under this Public License.\n\n  b. To the extent possible, if any provision of this Public License is\n     deemed unenforceable, it shall be automatically reformed to the\n     minimum extent necessary to make it enforceable. If the provision\n     cannot be reformed, it shall be severed from this Public License\n     without affecting the enforceability of the remaining terms and\n     conditions.\n\n  c. No term or condition of this Public License will be waived and no\n     failure to comply consented to unless expressly agreed to by the\n     Licensor.\n\n  d. Nothing in this Public License constitutes or may be interpreted\n     as a limitation upon, or waiver of, any privileges and immunities\n     that apply to the Licensor or You, including from the legal\n     processes of any jurisdiction or authority.\n\n\n=======================================================================\n\nCreative Commons is not a party to its public\nlicenses. Notwithstanding, Creative Commons may elect to apply one of\nits public licenses to material it publishes and in those instances\nwill be considered the “Licensor.” The text of the Creative Commons\npublic licenses is dedicated to the public domain under the CC0 Public\nDomain Dedication. Except for the limited purpose of indicating that\nmaterial is shared under a Creative Commons public license or as\notherwise permitted by the Creative Commons policies published at\ncreativecommons.org/policies, Creative Commons does not authorize the\nuse of the trademark \"Creative Commons\" or any other trademark or logo\nof Creative Commons without its prior written consent including,\nwithout limitation, in connection with any unauthorized modifications\nto any of its public licenses or any other arrangements,\nunderstandings, or agreements concerning use of licensed material. For\nthe avoidance of doubt, this paragraph does not form part of the\npublic licenses.\n\nCreative Commons may be contacted at creativecommons.org.\n"
  },
  {
    "path": "README.md",
    "content": "## tasksource ![](https://aeiljuispo.cloudimg.io/v7/https://s3.amazonaws.com/moonup/production/uploads/5fc0bcb41160c47d1d43856b/j06-U5e2Tifi2xOnTudqS.jpeg?w=20&h=20&f=face) 600+ curated datasets and preprocessings for instant and interchangeable use\n\nHuggingface Datasets is an excellent library, but it lacks standardization, and datasets often require preprocessing work to be used interchangeably.\n`tasksource` streamlines interchangeable datasets usage to scale evaluation or multi-task learning.\n\nEach dataset is standardized to a `MultipleChoice`, `Classification`, or `TokenClassification` template with canonical fields. We focus on discriminative tasks (= with negative examples or classes) for our annotations but also provide a `SequenceToSequence` template. All implemented preprocessings are in [tasks.py](https://github.com/sileod/tasksource/blob/main/src/tasksource/tasks.py) or [tasks.md](https://github.com/sileod/tasksource/blob/main/tasks.md). A preprocessing is a function that accepts a dataset and returns the standardized dataset. Preprocessing code is concise and human-readable.\n\n### Installation and usage:\n`pip install tasksource`\n```python\nfrom tasksource import list_tasks, load_task\ndf = list_tasks(multilingual=False) # takes some time\n\nfor id in df[df.task_type==\"MultipleChoice\"].id:\n    dataset = load_task(id) # all yielded datasets can be used interchangeably\n```\n\nBrowse the 500+ curated tasks in tasks.md (200+ MultipleChoice tasks, 200+ Classification tasks), and feel free to request a new task. Datasets are downloaded to `$HF_DATASETS_CACHE` (like any Hugging Face dataset), so ensure you have more than 100GB of space available.\n\nYou can now also use:\n```python\nload_dataset(\"tasksource/data\", \"glue/rte\",max_rows=30_000)\n```\n\n### Pretrained models:\n\nText encoder pretrained on tasksource reached state-of-the-art results: [🤗/deberta-v3-base-tasksource-nli](https://hf.co/sileod/deberta-v3-base-tasksource-nli)\n\nTasksource pretraining is notably helpful for RLHF reward modeling or any kind of classification, including zero-shot. You can also find a large and a multilingual version.\n\n### tasksource-instruct\n\nThe repo also contains some recasting code to convert tasksource datasets to instructions, providing one of the richest instruction-tuning datasets:\n[🤗/tasksource-instruct-v0](https://hf.co/datasets/tasksource/tasksource-instruct-v0)\n\n\n### tasksource-label-nli\n\nWe also recast all classification tasks as natural language inference, to improve entailment-based zero-shot classification detection:\n[🤗/zero-shot-label-nli](https://huggingface.co/datasets/tasksource/zero-shot-label-nli)\n\n### Write and use custom preprocessings\n\n```python\nfrom tasksource import MultipleChoice\n\ncodah = MultipleChoice('question_propmt',choices_list='candidate_answers',\n    labels='correct_answer_idx',\n    dataset_name='codah', config_name='codah')\n    \nwinogrande = MultipleChoice('sentence',['option1','option2'],'answer',\n    dataset_name='winogrande',config_name='winogrande_xl',\n    splits=['train','validation',None]) # test labels are not usable\n    \ntasks = [winogrande.load(), codah.load()]) #  Aligned datasets (same columns) can be used interchangably  \n```\n\n ### Citation and contact\n\nFor more details, refer to this [article:](https://arxiv.org/abs/2301.05948) \n```bib\n@inproceedings{sileo-2024-tasksource,\n    title = \"tasksource: A Large Collection of {NLP} tasks with a Structured Dataset Preprocessing Framework\",\n    author = \"Sileo, Damien\",\n    booktitle = \"Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)\",\n    month = may,\n    year = \"2024\",\n    address = \"Torino, Italia\",\n    publisher = \"ELRA and ICCL\",\n    url = \"https://aclanthology.org/2024.lrec-main.1361\",\n    pages = \"15655--15684\",\n}\n```\nFor help integrating tasksource into your experiments, please contact [damien.sileo@inria.fr](mailto:damien.sileo@inria.fr).\n\n                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                     \n"
  },
  {
    "path": "mtasks.md",
    "content": "|     | id                                                           | dataset_name                                | config_name                    | task_name   | preprocessing_name      | task_type           |\n|----:|:-------------------------------------------------------------|:--------------------------------------------|:-------------------------------|:------------|:------------------------|:--------------------|\n|   0 | xnli/ru                                                      | metaeval/xnli                               | ru                             |             | xnli                    | Classification      |\n|   1 | xnli/tr                                                      | metaeval/xnli                               | tr                             |             | xnli                    | Classification      |\n|   2 | xnli/ur                                                      | metaeval/xnli                               | ur                             |             | xnli                    | Classification      |\n|   3 | xnli/vi                                                      | metaeval/xnli                               | vi                             |             | xnli                    | Classification      |\n|   4 | xnli/zh                                                      | metaeval/xnli                               | zh                             |             | xnli                    | Classification      |\n|   5 | xnli/hi                                                      | metaeval/xnli                               | hi                             |             | xnli                    | Classification      |\n|   6 | xnli/fr                                                      | metaeval/xnli                               | fr                             |             | xnli                    | Classification      |\n|   7 | xnli/es                                                      | metaeval/xnli                               | es                             |             | xnli                    | Classification      |\n|   8 | xnli/en                                                      | metaeval/xnli                               | en                             |             | xnli                    | Classification      |\n|   9 | xnli/el                                                      | metaeval/xnli                               | el                             |             | xnli                    | Classification      |\n|  10 | xnli/de                                                      | metaeval/xnli                               | de                             |             | xnli                    | Classification      |\n|  11 | xnli/bg                                                      | metaeval/xnli                               | bg                             |             | xnli                    | Classification      |\n|  12 | xnli/ar                                                      | metaeval/xnli                               | ar                             |             | xnli                    | Classification      |\n|  13 | xnli/th                                                      | metaeval/xnli                               | th                             |             | xnli                    | Classification      |\n|  14 | xnli/sw                                                      | metaeval/xnli                               | sw                             |             | xnli                    | Classification      |\n|  15 | americas_nli/all_languages                                   | americas_nli                                | all_languages                  |             | americas_nli            | Classification      |\n|  16 | multilingual-NLI-26lang-2mil7/MoritzLaurer--multilingual_nli | MoritzLaurer/multilingual-NLI-26lang-2mil7  | MoritzLaurer--multilingual_nli |             | moritz_xnli             | Classification      |\n|  17 | stsb_multi_mt/en                                             | stsb_multi_mt                               | en                             |             | stsb_multi_mt           | Classification      |\n|  18 | stsb_multi_mt/fr                                             | stsb_multi_mt                               | fr                             |             | stsb_multi_mt           | Classification      |\n|  19 | stsb_multi_mt/de                                             | stsb_multi_mt                               | de                             |             | stsb_multi_mt           | Classification      |\n|  20 | stsb_multi_mt/es                                             | stsb_multi_mt                               | es                             |             | stsb_multi_mt           | Classification      |\n|  21 | stsb_multi_mt/it                                             | stsb_multi_mt                               | it                             |             | stsb_multi_mt           | Classification      |\n|  22 | stsb_multi_mt/nl                                             | stsb_multi_mt                               | nl                             |             | stsb_multi_mt           | Classification      |\n|  23 | stsb_multi_mt/pl                                             | stsb_multi_mt                               | pl                             |             | stsb_multi_mt           | Classification      |\n|  24 | stsb_multi_mt/pt                                             | stsb_multi_mt                               | pt                             |             | stsb_multi_mt           | Classification      |\n|  25 | stsb_multi_mt/ru                                             | stsb_multi_mt                               | ru                             |             | stsb_multi_mt           | Classification      |\n|  26 | stsb_multi_mt/zh                                             | stsb_multi_mt                               | zh                             |             | stsb_multi_mt           | Classification      |\n|  27 | paws-x/zh                                                    | paws-x                                      | zh                             |             | pawsx                   | Classification      |\n|  28 | paws-x/ja                                                    | paws-x                                      | ja                             |             | pawsx                   | Classification      |\n|  29 | paws-x/ko                                                    | paws-x                                      | ko                             |             | pawsx                   | Classification      |\n|  30 | paws-x/en                                                    | paws-x                                      | en                             |             | pawsx                   | Classification      |\n|  31 | paws-x/de                                                    | paws-x                                      | de                             |             | pawsx                   | Classification      |\n|  32 | paws-x/es                                                    | paws-x                                      | es                             |             | pawsx                   | Classification      |\n|  33 | paws-x/fr                                                    | paws-x                                      | fr                             |             | pawsx                   | Classification      |\n|  34 | miam/vm2                                                     | miam                                        | vm2                            |             | miam                    | Classification      |\n|  35 | miam/maptask                                                 | miam                                        | maptask                        |             | miam                    | Classification      |\n|  36 | miam/loria                                                   | miam                                        | loria                          |             | miam                    | Classification      |\n|  37 | miam/dihana                                                  | miam                                        | dihana                         |             | miam                    | Classification      |\n|  38 | miam/ilisten                                                 | miam                                        | ilisten                        |             | miam                    | Classification      |\n|  39 | x-stance/fr                                                  | strombergnlp/x-stance                       | fr                             |             | xstance                 | Classification      |\n|  40 | x-stance/de                                                  | strombergnlp/x-stance                       | de                             |             | xstance                 | Classification      |\n|  41 | offenseval_2020/da                                           | strombergnlp/offenseval_2020                | da                             |             | offenseval              | Classification      |\n|  42 | offenseval_2020/tr                                           | strombergnlp/offenseval_2020                | tr                             |             | offenseval              | Classification      |\n|  43 | offenseval_2020/gr                                           | strombergnlp/offenseval_2020                | gr                             |             | offenseval              | Classification      |\n|  44 | offenseval_2020/ar                                           | strombergnlp/offenseval_2020                | ar                             |             | offenseval              | Classification      |\n|  45 | offenseval_dravidian/tamil                                   | offenseval_dravidian                        | tamil                          |             | offenseval_dravidian    | Classification      |\n|  46 | offenseval_dravidian/malayalam                               | offenseval_dravidian                        | malayalam                      |             | offenseval_dravidian    | Classification      |\n|  47 | offenseval_dravidian/kannada                                 | offenseval_dravidian                        | kannada                        |             | offenseval_dravidian    | Classification      |\n|  48 | MLMA_hate_speech                                             | nedjmaou/MLMA_hate_speech                   |                                |             | mlma_hate               | Classification      |\n|  49 | xglue/qam                                                    | xglue                                       | qam                            |             | qam                     | Classification      |\n|  50 | x-fact                                                       | metaeval/x-fact                             |                                |             | x_fact                  | Classification      |\n|  51 | xglue/nc                                                     | xglue                                       | nc                             |             | xglue___nc              | Classification      |\n|  52 | xglue/qadsm                                                  | xglue                                       | qadsm                          |             | xglue___qadsm           | Classification      |\n|  53 | xglue/qam                                                    | xglue                                       | qam                            |             | xglue___qam             | Classification      |\n|  54 | xglue/wpr                                                    | xglue                                       | wpr                            |             | xglue___wpr             | Classification      |\n|  55 | xlwic/xlwic_fr_fr                                            | pasinit/xlwic                               | xlwic_fr_fr                    |             | xlwic                   | Classification      |\n|  56 | xlwic/xlwic_en_ko                                            | pasinit/xlwic                               | xlwic_en_ko                    |             | xlwic                   | Classification      |\n|  57 | xlwic/xlwic_it_it                                            | pasinit/xlwic                               | xlwic_it_it                    |             | xlwic                   | Classification      |\n|  58 | xlwic/xlwic_de_de                                            | pasinit/xlwic                               | xlwic_de_de                    |             | xlwic                   | Classification      |\n|  59 | oasst1_dense_flat/quality                                    | tasksource/oasst1_dense_flat                |                                | quality     | oasst1__quality         | Classification      |\n|  60 | oasst1_dense_flat/toxicity                                   | tasksource/oasst1_dense_flat                |                                | toxicity    | oasst1__toxicity        | Classification      |\n|  61 | oasst1_dense_flat/helpfulness                                | tasksource/oasst1_dense_flat                |                                | helpfulness | oasst1__helpfulness     | Classification      |\n|  62 | language-identification                                      | papluca/language-identification             |                                |             | language_identification | Classification      |\n|  63 | wili_2018                                                    | wili_2018                                   |                                |             | wili_2018_langid        | Classification      |\n|  64 | exams/multilingual                                           | exams                                       | multilingual                   |             | exams                   | MultipleChoice      |\n|  65 | xcsr/X-CSQA-ar                                               | xcsr                                        | X-CSQA-ar                      |             | xcsr                    | MultipleChoice      |\n|  66 | xcsr/X-CODAH-zh                                              | xcsr                                        | X-CODAH-zh                     |             | xcsr                    | MultipleChoice      |\n|  67 | xcsr/X-CODAH-de                                              | xcsr                                        | X-CODAH-de                     |             | xcsr                    | MultipleChoice      |\n|  68 | xcsr/X-CSQA-ru                                               | xcsr                                        | X-CSQA-ru                      |             | xcsr                    | MultipleChoice      |\n|  69 | xcsr/X-CODAH-fr                                              | xcsr                                        | X-CODAH-fr                     |             | xcsr                    | MultipleChoice      |\n|  70 | xcsr/X-CODAH-it                                              | xcsr                                        | X-CODAH-it                     |             | xcsr                    | MultipleChoice      |\n|  71 | xcsr/X-CODAH-jap                                             | xcsr                                        | X-CODAH-jap                    |             | xcsr                    | MultipleChoice      |\n|  72 | xcsr/X-CODAH-nl                                              | xcsr                                        | X-CODAH-nl                     |             | xcsr                    | MultipleChoice      |\n|  73 | xcsr/X-CODAH-pt                                              | xcsr                                        | X-CODAH-pt                     |             | xcsr                    | MultipleChoice      |\n|  74 | xcsr/X-CODAH-en                                              | xcsr                                        | X-CODAH-en                     |             | xcsr                    | MultipleChoice      |\n|  75 | xcsr/X-CODAH-ru                                              | xcsr                                        | X-CODAH-ru                     |             | xcsr                    | MultipleChoice      |\n|  76 | xcsr/X-CODAH-ar                                              | xcsr                                        | X-CODAH-ar                     |             | xcsr                    | MultipleChoice      |\n|  77 | xcsr/X-CODAH-vi                                              | xcsr                                        | X-CODAH-vi                     |             | xcsr                    | MultipleChoice      |\n|  78 | xcsr/X-CODAH-hi                                              | xcsr                                        | X-CODAH-hi                     |             | xcsr                    | MultipleChoice      |\n|  79 | xcsr/X-CODAH-sw                                              | xcsr                                        | X-CODAH-sw                     |             | xcsr                    | MultipleChoice      |\n|  80 | xcsr/X-CODAH-ur                                              | xcsr                                        | X-CODAH-ur                     |             | xcsr                    | MultipleChoice      |\n|  81 | xcsr/X-CODAH-pl                                              | xcsr                                        | X-CODAH-pl                     |             | xcsr                    | MultipleChoice      |\n|  82 | xcsr/X-CSQA-ur                                               | xcsr                                        | X-CSQA-ur                      |             | xcsr                    | MultipleChoice      |\n|  83 | xcsr/X-CODAH-es                                              | xcsr                                        | X-CODAH-es                     |             | xcsr                    | MultipleChoice      |\n|  84 | xcsr/X-CSQA-pt                                               | xcsr                                        | X-CSQA-pt                      |             | xcsr                    | MultipleChoice      |\n|  85 | xcsr/X-CSQA-vi                                               | xcsr                                        | X-CSQA-vi                      |             | xcsr                    | MultipleChoice      |\n|  86 | xcsr/X-CSQA-hi                                               | xcsr                                        | X-CSQA-hi                      |             | xcsr                    | MultipleChoice      |\n|  87 | xcsr/X-CSQA-pl                                               | xcsr                                        | X-CSQA-pl                      |             | xcsr                    | MultipleChoice      |\n|  88 | xcsr/X-CSQA-sw                                               | xcsr                                        | X-CSQA-sw                      |             | xcsr                    | MultipleChoice      |\n|  89 | xcsr/X-CSQA-nl                                               | xcsr                                        | X-CSQA-nl                      |             | xcsr                    | MultipleChoice      |\n|  90 | xcsr/X-CSQA-jap                                              | xcsr                                        | X-CSQA-jap                     |             | xcsr                    | MultipleChoice      |\n|  91 | xcsr/X-CSQA-it                                               | xcsr                                        | X-CSQA-it                      |             | xcsr                    | MultipleChoice      |\n|  92 | xcsr/X-CSQA-es                                               | xcsr                                        | X-CSQA-es                      |             | xcsr                    | MultipleChoice      |\n|  93 | xcsr/X-CSQA-fr                                               | xcsr                                        | X-CSQA-fr                      |             | xcsr                    | MultipleChoice      |\n|  94 | xcsr/X-CSQA-zh                                               | xcsr                                        | X-CSQA-zh                      |             | xcsr                    | MultipleChoice      |\n|  95 | xcsr/X-CSQA-en                                               | xcsr                                        | X-CSQA-en                      |             | xcsr                    | MultipleChoice      |\n|  96 | xcsr/X-CSQA-de                                               | xcsr                                        | X-CSQA-de                      |             | xcsr                    | MultipleChoice      |\n|  97 | xcopa/qu                                                     | xcopa                                       | qu                             |             | xcopa                   | MultipleChoice      |\n|  98 | xcopa/it                                                     | xcopa                                       | it                             |             | xcopa                   | MultipleChoice      |\n|  99 | xcopa/ht                                                     | xcopa                                       | ht                             |             | xcopa                   | MultipleChoice      |\n| 100 | xcopa/et                                                     | xcopa                                       | et                             |             | xcopa                   | MultipleChoice      |\n| 101 | xcopa/vi                                                     | xcopa                                       | vi                             |             | xcopa                   | MultipleChoice      |\n| 102 | xcopa/id                                                     | xcopa                                       | id                             |             | xcopa                   | MultipleChoice      |\n| 103 | xcopa/translation-et                                         | xcopa                                       | translation-et                 |             | xcopa                   | MultipleChoice      |\n| 104 | xcopa/th                                                     | xcopa                                       | th                             |             | xcopa                   | MultipleChoice      |\n| 105 | xcopa/sw                                                     | xcopa                                       | sw                             |             | xcopa                   | MultipleChoice      |\n| 106 | xcopa/translation-sw                                         | xcopa                                       | translation-sw                 |             | xcopa                   | MultipleChoice      |\n| 107 | xcopa/translation-ht                                         | xcopa                                       | translation-ht                 |             | xcopa                   | MultipleChoice      |\n| 108 | xcopa/translation-it                                         | xcopa                                       | translation-it                 |             | xcopa                   | MultipleChoice      |\n| 109 | xcopa/ta                                                     | xcopa                                       | ta                             |             | xcopa                   | MultipleChoice      |\n| 110 | xcopa/translation-zh                                         | xcopa                                       | translation-zh                 |             | xcopa                   | MultipleChoice      |\n| 111 | xcopa/translation-vi                                         | xcopa                                       | translation-vi                 |             | xcopa                   | MultipleChoice      |\n| 112 | xcopa/translation-id                                         | xcopa                                       | translation-id                 |             | xcopa                   | MultipleChoice      |\n| 113 | xcopa/translation-tr                                         | xcopa                                       | translation-tr                 |             | xcopa                   | MultipleChoice      |\n| 114 | xcopa/translation-th                                         | xcopa                                       | translation-th                 |             | xcopa                   | MultipleChoice      |\n| 115 | xcopa/translation-ta                                         | xcopa                                       | translation-ta                 |             | xcopa                   | MultipleChoice      |\n| 116 | xcopa/zh                                                     | xcopa                                       | zh                             |             | xcopa                   | MultipleChoice      |\n| 117 | xcopa/tr                                                     | xcopa                                       | tr                             |             | xcopa                   | MultipleChoice      |\n| 118 | xstory_cloze/eu                                              | juletxara/xstory_cloze                      | eu                             |             | xstory                  | MultipleChoice      |\n| 119 | xstory_cloze/my                                              | juletxara/xstory_cloze                      | my                             |             | xstory                  | MultipleChoice      |\n| 120 | xstory_cloze/te                                              | juletxara/xstory_cloze                      | te                             |             | xstory                  | MultipleChoice      |\n| 121 | xstory_cloze/sw                                              | juletxara/xstory_cloze                      | sw                             |             | xstory                  | MultipleChoice      |\n| 122 | xstory_cloze/en                                              | juletxara/xstory_cloze                      | en                             |             | xstory                  | MultipleChoice      |\n| 123 | xstory_cloze/ru                                              | juletxara/xstory_cloze                      | ru                             |             | xstory                  | MultipleChoice      |\n| 124 | xstory_cloze/zh                                              | juletxara/xstory_cloze                      | zh                             |             | xstory                  | MultipleChoice      |\n| 125 | xstory_cloze/es                                              | juletxara/xstory_cloze                      | es                             |             | xstory                  | MultipleChoice      |\n| 126 | xstory_cloze/ar                                              | juletxara/xstory_cloze                      | ar                             |             | xstory                  | MultipleChoice      |\n| 127 | xstory_cloze/hi                                              | juletxara/xstory_cloze                      | hi                             |             | xstory                  | MultipleChoice      |\n| 128 | xstory_cloze/id                                              | juletxara/xstory_cloze                      | id                             |             | xstory                  | MultipleChoice      |\n| 129 | xglue/ner                                                    | xglue                                       | ner                            |             | xglue_ner               | TokenClassification |\n| 130 | xglue/pos                                                    | xglue                                       | pos                            |             | xglue_pos               | TokenClassification |\n| 131 | universal_dependencies/nyq_aha/pos                           | universal_dependencies                      | nyq_aha                        | pos         | udep__pos               | TokenClassification |\n| 132 | universal_dependencies/sme_giella/pos                        | universal_dependencies                      | sme_giella                     | pos         | udep__pos               | TokenClassification |\n| 133 | universal_dependencies/no_bokmaal/pos                        | universal_dependencies                      | no_bokmaal                     | pos         | udep__pos               | TokenClassification |\n| 134 | universal_dependencies/no_nynorsk/pos                        | universal_dependencies                      | no_nynorsk                     | pos         | udep__pos               | TokenClassification |\n| 135 | universal_dependencies/no_nynorsklia/pos                     | universal_dependencies                      | no_nynorsklia                  | pos         | udep__pos               | TokenClassification |\n| 136 | universal_dependencies/cu_proiel/pos                         | universal_dependencies                      | cu_proiel                      | pos         | udep__pos               | TokenClassification |\n| 137 | universal_dependencies/fro_srcmf/pos                         | universal_dependencies                      | fro_srcmf                      | pos         | udep__pos               | TokenClassification |\n| 138 | universal_dependencies/orv_rnc/pos                           | universal_dependencies                      | orv_rnc                        | pos         | udep__pos               | TokenClassification |\n| 139 | universal_dependencies/pl_lfg/pos                            | universal_dependencies                      | pl_lfg                         | pos         | udep__pos               | TokenClassification |\n| 140 | universal_dependencies/otk_tonqq/pos                         | universal_dependencies                      | otk_tonqq                      | pos         | udep__pos               | TokenClassification |\n| 141 | universal_dependencies/fa_perdt/pos                          | universal_dependencies                      | fa_perdt                       | pos         | udep__pos               | TokenClassification |\n| 142 | universal_dependencies/fa_seraji/pos                         | universal_dependencies                      | fa_seraji                      | pos         | udep__pos               | TokenClassification |\n| 143 | universal_dependencies/pcm_nsc/pos                           | universal_dependencies                      | pcm_nsc                        | pos         | udep__pos               | TokenClassification |\n| 144 | universal_dependencies/pl_pdb/pos                            | universal_dependencies                      | pl_pdb                         | pos         | udep__pos               | TokenClassification |\n| 145 | universal_dependencies/pl_pud/pos                            | universal_dependencies                      | pl_pud                         | pos         | udep__pos               | TokenClassification |\n| 146 | universal_dependencies/pt_bosque/pos                         | universal_dependencies                      | pt_bosque                      | pos         | udep__pos               | TokenClassification |\n| 147 | universal_dependencies/pt_gsd/pos                            | universal_dependencies                      | pt_gsd                         | pos         | udep__pos               | TokenClassification |\n| 148 | universal_dependencies/pt_pud/pos                            | universal_dependencies                      | pt_pud                         | pos         | udep__pos               | TokenClassification |\n| 149 | universal_dependencies/orv_torot/pos                         | universal_dependencies                      | orv_torot                      | pos         | udep__pos               | TokenClassification |\n| 150 | universal_dependencies/myu_tudet/pos                         | universal_dependencies                      | myu_tudet                      | pos         | udep__pos               | TokenClassification |\n| 151 | universal_dependencies/gv_cadhan/pos                         | universal_dependencies                      | gv_cadhan                      | pos         | udep__pos               | TokenClassification |\n| 152 | universal_dependencies/gun_thomas/pos                        | universal_dependencies                      | gun_thomas                     | pos         | udep__pos               | TokenClassification |\n| 153 | universal_dependencies/koi_uh/pos                            | universal_dependencies                      | koi_uh                         | pos         | udep__pos               | TokenClassification |\n| 154 | universal_dependencies/kpv_ikdp/pos                          | universal_dependencies                      | kpv_ikdp                       | pos         | udep__pos               | TokenClassification |\n| 155 | universal_dependencies/kpv_lattice/pos                       | universal_dependencies                      | kpv_lattice                    | pos         | udep__pos               | TokenClassification |\n| 156 | universal_dependencies/ko_gsd/pos                            | universal_dependencies                      | ko_gsd                         | pos         | udep__pos               | TokenClassification |\n| 157 | universal_dependencies/ko_kaist/pos                          | universal_dependencies                      | ko_kaist                       | pos         | udep__pos               | TokenClassification |\n| 158 | universal_dependencies/ko_pud/pos                            | universal_dependencies                      | ko_pud                         | pos         | udep__pos               | TokenClassification |\n| 159 | universal_dependencies/kmr_mg/pos                            | universal_dependencies                      | kmr_mg                         | pos         | udep__pos               | TokenClassification |\n| 160 | universal_dependencies/la_ittb/pos                           | universal_dependencies                      | la_ittb                        | pos         | udep__pos               | TokenClassification |\n| 161 | universal_dependencies/la_llct/pos                           | universal_dependencies                      | la_llct                        | pos         | udep__pos               | TokenClassification |\n| 162 | universal_dependencies/la_perseus/pos                        | universal_dependencies                      | la_perseus                     | pos         | udep__pos               | TokenClassification |\n| 163 | universal_dependencies/la_proiel/pos                         | universal_dependencies                      | la_proiel                      | pos         | udep__pos               | TokenClassification |\n| 164 | universal_dependencies/lv_lvtb/pos                           | universal_dependencies                      | lv_lvtb                        | pos         | udep__pos               | TokenClassification |\n| 165 | universal_dependencies/lt_alksnis/pos                        | universal_dependencies                      | lt_alksnis                     | pos         | udep__pos               | TokenClassification |\n| 166 | universal_dependencies/lt_hse/pos                            | universal_dependencies                      | lt_hse                         | pos         | udep__pos               | TokenClassification |\n| 167 | universal_dependencies/olo_kkpp/pos                          | universal_dependencies                      | olo_kkpp                       | pos         | udep__pos               | TokenClassification |\n| 168 | universal_dependencies/mt_mudt/pos                           | universal_dependencies                      | mt_mudt                        | pos         | udep__pos               | TokenClassification |\n| 169 | universal_dependencies/ro_nonstandard/pos                    | universal_dependencies                      | ro_nonstandard                 | pos         | udep__pos               | TokenClassification |\n| 170 | universal_dependencies/mr_ufal/pos                           | universal_dependencies                      | mr_ufal                        | pos         | udep__pos               | TokenClassification |\n| 171 | universal_dependencies/gun_dooley/pos                        | universal_dependencies                      | gun_dooley                     | pos         | udep__pos               | TokenClassification |\n| 172 | universal_dependencies/mdf_jr/pos                            | universal_dependencies                      | mdf_jr                         | pos         | udep__pos               | TokenClassification |\n| 173 | universal_dependencies/ro_rrt/pos                            | universal_dependencies                      | ro_rrt                         | pos         | udep__pos               | TokenClassification |\n| 174 | universal_dependencies/ru_taiga/pos                          | universal_dependencies                      | ru_taiga                       | pos         | udep__pos               | TokenClassification |\n| 175 | universal_dependencies/ru_gsd/pos                            | universal_dependencies                      | ru_gsd                         | pos         | udep__pos               | TokenClassification |\n| 176 | universal_dependencies/ta_mwtt/pos                           | universal_dependencies                      | ta_mwtt                        | pos         | udep__pos               | TokenClassification |\n| 177 | universal_dependencies/ta_ttb/pos                            | universal_dependencies                      | ta_ttb                         | pos         | udep__pos               | TokenClassification |\n| 178 | universal_dependencies/te_mtg/pos                            | universal_dependencies                      | te_mtg                         | pos         | udep__pos               | TokenClassification |\n| 179 | universal_dependencies/th_pud/pos                            | universal_dependencies                      | th_pud                         | pos         | udep__pos               | TokenClassification |\n| 180 | universal_dependencies/tpn_tudet/pos                         | universal_dependencies                      | tpn_tudet                      | pos         | udep__pos               | TokenClassification |\n| 181 | universal_dependencies/qtd_sagt/pos                          | universal_dependencies                      | qtd_sagt                       | pos         | udep__pos               | TokenClassification |\n| 182 | universal_dependencies/tr_boun/pos                           | universal_dependencies                      | tr_boun                        | pos         | udep__pos               | TokenClassification |\n| 183 | universal_dependencies/tr_gb/pos                             | universal_dependencies                      | tr_gb                          | pos         | udep__pos               | TokenClassification |\n| 184 | universal_dependencies/tr_imst/pos                           | universal_dependencies                      | tr_imst                        | pos         | udep__pos               | TokenClassification |\n| 185 | universal_dependencies/tr_pud/pos                            | universal_dependencies                      | tr_pud                         | pos         | udep__pos               | TokenClassification |\n| 186 | universal_dependencies/uk_iu/pos                             | universal_dependencies                      | uk_iu                          | pos         | udep__pos               | TokenClassification |\n| 187 | universal_dependencies/hsb_ufal/pos                          | universal_dependencies                      | hsb_ufal                       | pos         | udep__pos               | TokenClassification |\n| 188 | universal_dependencies/ur_udtb/pos                           | universal_dependencies                      | ur_udtb                        | pos         | udep__pos               | TokenClassification |\n| 189 | universal_dependencies/ug_udt/pos                            | universal_dependencies                      | ug_udt                         | pos         | udep__pos               | TokenClassification |\n| 190 | universal_dependencies/vi_vtb/pos                            | universal_dependencies                      | vi_vtb                         | pos         | udep__pos               | TokenClassification |\n| 191 | universal_dependencies/wbp_ufal/pos                          | universal_dependencies                      | wbp_ufal                       | pos         | udep__pos               | TokenClassification |\n| 192 | universal_dependencies/cy_ccg/pos                            | universal_dependencies                      | cy_ccg                         | pos         | udep__pos               | TokenClassification |\n| 193 | universal_dependencies/wo_wtb/pos                            | universal_dependencies                      | wo_wtb                         | pos         | udep__pos               | TokenClassification |\n| 194 | universal_dependencies/yo_ytb/pos                            | universal_dependencies                      | yo_ytb                         | pos         | udep__pos               | TokenClassification |\n| 195 | universal_dependencies/tl_ugnayan/pos                        | universal_dependencies                      | tl_ugnayan                     | pos         | udep__pos               | TokenClassification |\n| 196 | universal_dependencies/ro_simonero/pos                       | universal_dependencies                      | ro_simonero                    | pos         | udep__pos               | TokenClassification |\n| 197 | universal_dependencies/tl_trg/pos                            | universal_dependencies                      | tl_trg                         | pos         | udep__pos               | TokenClassification |\n| 198 | universal_dependencies/sv_talbanken/pos                      | universal_dependencies                      | sv_talbanken                   | pos         | udep__pos               | TokenClassification |\n| 199 | universal_dependencies/ru_pud/pos                            | universal_dependencies                      | ru_pud                         | pos         | udep__pos               | TokenClassification |\n| 200 | universal_dependencies/ru_syntagrus/pos                      | universal_dependencies                      | ru_syntagrus                   | pos         | udep__pos               | TokenClassification |\n| 201 | universal_dependencies/kfm_aha/pos                           | universal_dependencies                      | kfm_aha                        | pos         | udep__pos               | TokenClassification |\n| 202 | universal_dependencies/sa_ufal/pos                           | universal_dependencies                      | sa_ufal                        | pos         | udep__pos               | TokenClassification |\n| 203 | universal_dependencies/sa_vedic/pos                          | universal_dependencies                      | sa_vedic                       | pos         | udep__pos               | TokenClassification |\n| 204 | universal_dependencies/gd_arcosg/pos                         | universal_dependencies                      | gd_arcosg                      | pos         | udep__pos               | TokenClassification |\n| 205 | universal_dependencies/sr_set/pos                            | universal_dependencies                      | sr_set                         | pos         | udep__pos               | TokenClassification |\n| 206 | universal_dependencies/sms_giellagas/pos                     | universal_dependencies                      | sms_giellagas                  | pos         | udep__pos               | TokenClassification |\n| 207 | universal_dependencies/sk_snk/pos                            | universal_dependencies                      | sk_snk                         | pos         | udep__pos               | TokenClassification |\n| 208 | universal_dependencies/sl_ssj/pos                            | universal_dependencies                      | sl_ssj                         | pos         | udep__pos               | TokenClassification |\n| 209 | universal_dependencies/sl_sst/pos                            | universal_dependencies                      | sl_sst                         | pos         | udep__pos               | TokenClassification |\n| 210 | universal_dependencies/soj_aha/pos                           | universal_dependencies                      | soj_aha                        | pos         | udep__pos               | TokenClassification |\n| 211 | universal_dependencies/ajp_madar/pos                         | universal_dependencies                      | ajp_madar                      | pos         | udep__pos               | TokenClassification |\n| 212 | universal_dependencies/es_ancora/pos                         | universal_dependencies                      | es_ancora                      | pos         | udep__pos               | TokenClassification |\n| 213 | universal_dependencies/es_gsd/pos                            | universal_dependencies                      | es_gsd                         | pos         | udep__pos               | TokenClassification |\n| 214 | universal_dependencies/es_pud/pos                            | universal_dependencies                      | es_pud                         | pos         | udep__pos               | TokenClassification |\n| 215 | universal_dependencies/swl_sslc/pos                          | universal_dependencies                      | swl_sslc                       | pos         | udep__pos               | TokenClassification |\n| 216 | universal_dependencies/sv_lines/pos                          | universal_dependencies                      | sv_lines                       | pos         | udep__pos               | TokenClassification |\n| 217 | universal_dependencies/sv_pud/pos                            | universal_dependencies                      | sv_pud                         | pos         | udep__pos               | TokenClassification |\n| 218 | universal_dependencies/gsw_uzh/pos                           | universal_dependencies                      | gsw_uzh                        | pos         | udep__pos               | TokenClassification |\n| 219 | universal_dependencies/kk_ktb/pos                            | universal_dependencies                      | kk_ktb                         | pos         | udep__pos               | TokenClassification |\n| 220 | universal_dependencies/hi_hdtb/pos                           | universal_dependencies                      | hi_hdtb                        | pos         | udep__pos               | TokenClassification |\n| 221 | universal_dependencies/ja_pud/pos                            | universal_dependencies                      | ja_pud                         | pos         | udep__pos               | TokenClassification |\n| 222 | universal_dependencies/zh_gsd/pos                            | universal_dependencies                      | zh_gsd                         | pos         | udep__pos               | TokenClassification |\n| 223 | universal_dependencies/zh_gsdsimp/pos                        | universal_dependencies                      | zh_gsdsimp                     | pos         | udep__pos               | TokenClassification |\n| 224 | universal_dependencies/zh_hk/pos                             | universal_dependencies                      | zh_hk                          | pos         | udep__pos               | TokenClassification |\n| 225 | universal_dependencies/zh_pud/pos                            | universal_dependencies                      | zh_pud                         | pos         | udep__pos               | TokenClassification |\n| 226 | universal_dependencies/ckt_hse/pos                           | universal_dependencies                      | ckt_hse                        | pos         | udep__pos               | TokenClassification |\n| 227 | universal_dependencies/lzh_kyoto/pos                         | universal_dependencies                      | lzh_kyoto                      | pos         | udep__pos               | TokenClassification |\n| 228 | universal_dependencies/cop_scriptorium/pos                   | universal_dependencies                      | cop_scriptorium                | pos         | udep__pos               | TokenClassification |\n| 229 | universal_dependencies/hr_set/pos                            | universal_dependencies                      | hr_set                         | pos         | udep__pos               | TokenClassification |\n| 230 | universal_dependencies/cs_cac/pos                            | universal_dependencies                      | cs_cac                         | pos         | udep__pos               | TokenClassification |\n| 231 | universal_dependencies/cs_cltt/pos                           | universal_dependencies                      | cs_cltt                        | pos         | udep__pos               | TokenClassification |\n| 232 | universal_dependencies/cs_fictree/pos                        | universal_dependencies                      | cs_fictree                     | pos         | udep__pos               | TokenClassification |\n| 233 | universal_dependencies/cs_pdt/pos                            | universal_dependencies                      | cs_pdt                         | pos         | udep__pos               | TokenClassification |\n| 234 | universal_dependencies/cs_pud/pos                            | universal_dependencies                      | cs_pud                         | pos         | udep__pos               | TokenClassification |\n| 235 | universal_dependencies/da_ddt/pos                            | universal_dependencies                      | da_ddt                         | pos         | udep__pos               | TokenClassification |\n| 236 | universal_dependencies/nl_alpino/pos                         | universal_dependencies                      | nl_alpino                      | pos         | udep__pos               | TokenClassification |\n| 237 | universal_dependencies/nl_lassysmall/pos                     | universal_dependencies                      | nl_lassysmall                  | pos         | udep__pos               | TokenClassification |\n| 238 | universal_dependencies/en_esl/pos                            | universal_dependencies                      | en_esl                         | pos         | udep__pos               | TokenClassification |\n| 239 | universal_dependencies/en_ewt/pos                            | universal_dependencies                      | en_ewt                         | pos         | udep__pos               | TokenClassification |\n| 240 | universal_dependencies/en_gum/pos                            | universal_dependencies                      | en_gum                         | pos         | udep__pos               | TokenClassification |\n| 241 | universal_dependencies/zh_cfl/pos                            | universal_dependencies                      | zh_cfl                         | pos         | udep__pos               | TokenClassification |\n| 242 | universal_dependencies/ca_ancora/pos                         | universal_dependencies                      | ca_ancora                      | pos         | udep__pos               | TokenClassification |\n| 243 | universal_dependencies/yue_hk/pos                            | universal_dependencies                      | yue_hk                         | pos         | udep__pos               | TokenClassification |\n| 244 | universal_dependencies/bxr_bdt/pos                           | universal_dependencies                      | bxr_bdt                        | pos         | udep__pos               | TokenClassification |\n| 245 | universal_dependencies/af_afribooms/pos                      | universal_dependencies                      | af_afribooms                   | pos         | udep__pos               | TokenClassification |\n| 246 | universal_dependencies/krl_kkpp/pos                          | universal_dependencies                      | krl_kkpp                       | pos         | udep__pos               | TokenClassification |\n| 247 | universal_dependencies/akk_riao/pos                          | universal_dependencies                      | akk_riao                       | pos         | udep__pos               | TokenClassification |\n| 248 | universal_dependencies/aqz_tudet/pos                         | universal_dependencies                      | aqz_tudet                      | pos         | udep__pos               | TokenClassification |\n| 249 | universal_dependencies/sq_tsa/pos                            | universal_dependencies                      | sq_tsa                         | pos         | udep__pos               | TokenClassification |\n| 250 | universal_dependencies/am_att/pos                            | universal_dependencies                      | am_att                         | pos         | udep__pos               | TokenClassification |\n| 251 | universal_dependencies/grc_perseus/pos                       | universal_dependencies                      | grc_perseus                    | pos         | udep__pos               | TokenClassification |\n| 252 | universal_dependencies/grc_proiel/pos                        | universal_dependencies                      | grc_proiel                     | pos         | udep__pos               | TokenClassification |\n| 253 | universal_dependencies/apu_ufpa/pos                          | universal_dependencies                      | apu_ufpa                       | pos         | udep__pos               | TokenClassification |\n| 254 | universal_dependencies/en_gumreddit/pos                      | universal_dependencies                      | en_gumreddit                   | pos         | udep__pos               | TokenClassification |\n| 255 | universal_dependencies/ar_nyuad/pos                          | universal_dependencies                      | ar_nyuad                       | pos         | udep__pos               | TokenClassification |\n| 256 | universal_dependencies/ar_pud/pos                            | universal_dependencies                      | ar_pud                         | pos         | udep__pos               | TokenClassification |\n| 257 | universal_dependencies/hy_armtdp/pos                         | universal_dependencies                      | hy_armtdp                      | pos         | udep__pos               | TokenClassification |\n| 258 | universal_dependencies/aii_as/pos                            | universal_dependencies                      | aii_as                         | pos         | udep__pos               | TokenClassification |\n| 259 | universal_dependencies/bm_crb/pos                            | universal_dependencies                      | bm_crb                         | pos         | udep__pos               | TokenClassification |\n| 260 | universal_dependencies/eu_bdt/pos                            | universal_dependencies                      | eu_bdt                         | pos         | udep__pos               | TokenClassification |\n| 261 | universal_dependencies/be_hse/pos                            | universal_dependencies                      | be_hse                         | pos         | udep__pos               | TokenClassification |\n| 262 | universal_dependencies/bho_bhtb/pos                          | universal_dependencies                      | bho_bhtb                       | pos         | udep__pos               | TokenClassification |\n| 263 | universal_dependencies/br_keb/pos                            | universal_dependencies                      | br_keb                         | pos         | udep__pos               | TokenClassification |\n| 264 | universal_dependencies/bg_btb/pos                            | universal_dependencies                      | bg_btb                         | pos         | udep__pos               | TokenClassification |\n| 265 | universal_dependencies/ar_padt/pos                           | universal_dependencies                      | ar_padt                        | pos         | udep__pos               | TokenClassification |\n| 266 | universal_dependencies/en_lines/pos                          | universal_dependencies                      | en_lines                       | pos         | udep__pos               | TokenClassification |\n| 267 | universal_dependencies/akk_pisandub/pos                      | universal_dependencies                      | akk_pisandub                   | pos         | udep__pos               | TokenClassification |\n| 268 | universal_dependencies/en_pronouns/pos                       | universal_dependencies                      | en_pronouns                    | pos         | udep__pos               | TokenClassification |\n| 269 | universal_dependencies/el_gdt/pos                            | universal_dependencies                      | el_gdt                         | pos         | udep__pos               | TokenClassification |\n| 270 | universal_dependencies/he_htb/pos                            | universal_dependencies                      | he_htb                         | pos         | udep__pos               | TokenClassification |\n| 271 | universal_dependencies/qhe_hiencs/pos                        | universal_dependencies                      | qhe_hiencs                     | pos         | udep__pos               | TokenClassification |\n| 272 | universal_dependencies/hi_pud/pos                            | universal_dependencies                      | hi_pud                         | pos         | udep__pos               | TokenClassification |\n| 273 | universal_dependencies/hu_szeged/pos                         | universal_dependencies                      | hu_szeged                      | pos         | udep__pos               | TokenClassification |\n| 274 | universal_dependencies/is_icepahc/pos                        | universal_dependencies                      | is_icepahc                     | pos         | udep__pos               | TokenClassification |\n| 275 | universal_dependencies/id_csui/pos                           | universal_dependencies                      | id_csui                        | pos         | udep__pos               | TokenClassification |\n| 276 | universal_dependencies/id_gsd/pos                            | universal_dependencies                      | id_gsd                         | pos         | udep__pos               | TokenClassification |\n| 277 | universal_dependencies/id_pud/pos                            | universal_dependencies                      | id_pud                         | pos         | udep__pos               | TokenClassification |\n| 278 | universal_dependencies/ga_idt/pos                            | universal_dependencies                      | ga_idt                         | pos         | udep__pos               | TokenClassification |\n| 279 | universal_dependencies/it_isdt/pos                           | universal_dependencies                      | it_isdt                        | pos         | udep__pos               | TokenClassification |\n| 280 | universal_dependencies/it_partut/pos                         | universal_dependencies                      | it_partut                      | pos         | udep__pos               | TokenClassification |\n| 281 | universal_dependencies/it_postwita/pos                       | universal_dependencies                      | it_postwita                    | pos         | udep__pos               | TokenClassification |\n| 282 | universal_dependencies/it_pud/pos                            | universal_dependencies                      | it_pud                         | pos         | udep__pos               | TokenClassification |\n| 283 | universal_dependencies/it_twittiro/pos                       | universal_dependencies                      | it_twittiro                    | pos         | udep__pos               | TokenClassification |\n| 284 | universal_dependencies/it_vit/pos                            | universal_dependencies                      | it_vit                         | pos         | udep__pos               | TokenClassification |\n| 285 | universal_dependencies/ja_bccwj/pos                          | universal_dependencies                      | ja_bccwj                       | pos         | udep__pos               | TokenClassification |\n| 286 | universal_dependencies/ja_gsd/pos                            | universal_dependencies                      | ja_gsd                         | pos         | udep__pos               | TokenClassification |\n| 287 | universal_dependencies/ja_modern/pos                         | universal_dependencies                      | ja_modern                      | pos         | udep__pos               | TokenClassification |\n| 288 | universal_dependencies/got_proiel/pos                        | universal_dependencies                      | got_proiel                     | pos         | udep__pos               | TokenClassification |\n| 289 | universal_dependencies/de_pud/pos                            | universal_dependencies                      | de_pud                         | pos         | udep__pos               | TokenClassification |\n| 290 | universal_dependencies/is_pud/pos                            | universal_dependencies                      | is_pud                         | pos         | udep__pos               | TokenClassification |\n| 291 | universal_dependencies/de_hdt/pos                            | universal_dependencies                      | de_hdt                         | pos         | udep__pos               | TokenClassification |\n| 292 | universal_dependencies/en_pud/pos                            | universal_dependencies                      | en_pud                         | pos         | udep__pos               | TokenClassification |\n| 293 | universal_dependencies/myv_jr/pos                            | universal_dependencies                      | myv_jr                         | pos         | udep__pos               | TokenClassification |\n| 294 | universal_dependencies/de_lit/pos                            | universal_dependencies                      | de_lit                         | pos         | udep__pos               | TokenClassification |\n| 295 | universal_dependencies/et_ewt/pos                            | universal_dependencies                      | et_ewt                         | pos         | udep__pos               | TokenClassification |\n| 296 | universal_dependencies/fo_farpahc/pos                        | universal_dependencies                      | fo_farpahc                     | pos         | udep__pos               | TokenClassification |\n| 297 | universal_dependencies/fo_oft/pos                            | universal_dependencies                      | fo_oft                         | pos         | udep__pos               | TokenClassification |\n| 298 | universal_dependencies/fi_ftb/pos                            | universal_dependencies                      | fi_ftb                         | pos         | udep__pos               | TokenClassification |\n| 299 | universal_dependencies/fi_ood/pos                            | universal_dependencies                      | fi_ood                         | pos         | udep__pos               | TokenClassification |\n| 300 | universal_dependencies/fi_pud/pos                            | universal_dependencies                      | fi_pud                         | pos         | udep__pos               | TokenClassification |\n| 301 | universal_dependencies/fi_tdt/pos                            | universal_dependencies                      | fi_tdt                         | pos         | udep__pos               | TokenClassification |\n| 302 | universal_dependencies/et_edt/pos                            | universal_dependencies                      | et_edt                         | pos         | udep__pos               | TokenClassification |\n| 303 | universal_dependencies/fr_ftb/pos                            | universal_dependencies                      | fr_ftb                         | pos         | udep__pos               | TokenClassification |\n| 304 | universal_dependencies/fr_fqb/pos                            | universal_dependencies                      | fr_fqb                         | pos         | udep__pos               | TokenClassification |\n| 305 | universal_dependencies/de_gsd/pos                            | universal_dependencies                      | de_gsd                         | pos         | udep__pos               | TokenClassification |\n| 306 | universal_dependencies/gl_treegal/pos                        | universal_dependencies                      | gl_treegal                     | pos         | udep__pos               | TokenClassification |\n| 307 | universal_dependencies/gl_ctg/pos                            | universal_dependencies                      | gl_ctg                         | pos         | udep__pos               | TokenClassification |\n| 308 | universal_dependencies/fr_spoken/pos                         | universal_dependencies                      | fr_spoken                      | pos         | udep__pos               | TokenClassification |\n| 309 | universal_dependencies/en_partut/pos                         | universal_dependencies                      | en_partut                      | pos         | udep__pos               | TokenClassification |\n| 310 | universal_dependencies/fr_pud/pos                            | universal_dependencies                      | fr_pud                         | pos         | udep__pos               | TokenClassification |\n| 311 | universal_dependencies/fr_partut/pos                         | universal_dependencies                      | fr_partut                      | pos         | udep__pos               | TokenClassification |\n| 312 | universal_dependencies/fr_sequoia/pos                        | universal_dependencies                      | fr_sequoia                     | pos         | udep__pos               | TokenClassification |\n| 313 | universal_dependencies/fr_gsd/pos                            | universal_dependencies                      | fr_gsd                         | pos         | udep__pos               | TokenClassification |\n| 314 | oasst1_pairwise_rlhf_reward                                  | tasksource/oasst1_pairwise_rlhf_reward      |                                |             | oasst_rlhf              | MultipleChoice      |\n| 315 | multilingual-sentiments/all                                  | tyqiangz/multilingual-sentiments            | all                            |             | sentiment               | Classification      |\n| 316 | tweet_sentiment_multilingual/arabic                          | cardiffnlp/tweet_sentiment_multilingual     | arabic                         |             | tweet_sentiment         | Classification      |\n| 317 | tweet_sentiment_multilingual/french                          | cardiffnlp/tweet_sentiment_multilingual     | french                         |             | tweet_sentiment         | Classification      |\n| 318 | tweet_sentiment_multilingual/english                         | cardiffnlp/tweet_sentiment_multilingual     | english                        |             | tweet_sentiment         | Classification      |\n| 319 | tweet_sentiment_multilingual/hindi                           | cardiffnlp/tweet_sentiment_multilingual     | hindi                          |             | tweet_sentiment         | Classification      |\n| 320 | tweet_sentiment_multilingual/portuguese                      | cardiffnlp/tweet_sentiment_multilingual     | portuguese                     |             | tweet_sentiment         | Classification      |\n| 321 | tweet_sentiment_multilingual/spanish                         | cardiffnlp/tweet_sentiment_multilingual     | spanish                        |             | tweet_sentiment         | Classification      |\n| 322 | tweet_sentiment_multilingual/all                             | cardiffnlp/tweet_sentiment_multilingual     | all                            |             | tweet_sentiment         | Classification      |\n| 323 | tweet_sentiment_multilingual/german                          | cardiffnlp/tweet_sentiment_multilingual     | german                         |             | tweet_sentiment         | Classification      |\n| 324 | tweet_sentiment_multilingual/italian                         | cardiffnlp/tweet_sentiment_multilingual     | italian                        |             | tweet_sentiment         | Classification      |\n| 325 | amazon_reviews_multi/all_languages                           | amazon_reviews_multi                        | all_languages                  |             | review_sentiment        | Classification      |\n| 326 | universal-joy                                                | metaeval/universal-joy                      |                                |             | emotion                 | Classification      |\n| 327 | mms                                                          | Brand24/mms                                 |                                |             | mms_sentiment           | Classification      |\n| 328 | mapa                                                         | joelito/mapa                                |                                |             | mapa_fine               | TokenClassification |\n| 329 | mapa                                                         | joelito/mapa                                |                                |             | mapa_corase             | TokenClassification |\n| 330 | ACES                                                         | nikitam/ACES                                |                                |             | aces_ranking            | MultipleChoice      |\n| 331 | ACES                                                         | nikitam/ACES                                |                                |             | aces_phenomena          | Classification      |\n| 332 | massive/my-MM                                                | AmazonScience/massive                       | my-MM                          |             | amazon_intent           | Classification      |\n| 333 | massive/ro-RO                                                | AmazonScience/massive                       | ro-RO                          |             | amazon_intent           | Classification      |\n| 334 | massive/pt-PT                                                | AmazonScience/massive                       | pt-PT                          |             | amazon_intent           | Classification      |\n| 335 | massive/pl-PL                                                | AmazonScience/massive                       | pl-PL                          |             | amazon_intent           | Classification      |\n| 336 | massive/nl-NL                                                | AmazonScience/massive                       | nl-NL                          |             | amazon_intent           | Classification      |\n| 337 | massive/nb-NO                                                | AmazonScience/massive                       | nb-NO                          |             | amazon_intent           | Classification      |\n| 338 | massive/es-ES                                                | AmazonScience/massive                       | es-ES                          |             | amazon_intent           | Classification      |\n| 339 | massive/ms-MY                                                | AmazonScience/massive                       | ms-MY                          |             | amazon_intent           | Classification      |\n| 340 | massive/mn-MN                                                | AmazonScience/massive                       | mn-MN                          |             | amazon_intent           | Classification      |\n| 341 | massive/ml-IN                                                | AmazonScience/massive                       | ml-IN                          |             | amazon_intent           | Classification      |\n| 342 | massive/lv-LV                                                | AmazonScience/massive                       | lv-LV                          |             | amazon_intent           | Classification      |\n| 343 | massive/ko-KR                                                | AmazonScience/massive                       | ko-KR                          |             | amazon_intent           | Classification      |\n| 344 | massive/ru-RU                                                | AmazonScience/massive                       | ru-RU                          |             | amazon_intent           | Classification      |\n| 345 | massive/kn-IN                                                | AmazonScience/massive                       | kn-IN                          |             | amazon_intent           | Classification      |\n| 346 | massive/ka-GE                                                | AmazonScience/massive                       | ka-GE                          |             | amazon_intent           | Classification      |\n| 347 | massive/jv-ID                                                | AmazonScience/massive                       | jv-ID                          |             | amazon_intent           | Classification      |\n| 348 | massive/ja-JP                                                | AmazonScience/massive                       | ja-JP                          |             | amazon_intent           | Classification      |\n| 349 | massive/it-IT                                                | AmazonScience/massive                       | it-IT                          |             | amazon_intent           | Classification      |\n| 350 | massive/is-IS                                                | AmazonScience/massive                       | is-IS                          |             | amazon_intent           | Classification      |\n| 351 | massive/id-ID                                                | AmazonScience/massive                       | id-ID                          |             | amazon_intent           | Classification      |\n| 352 | massive/hy-AM                                                | AmazonScience/massive                       | hy-AM                          |             | amazon_intent           | Classification      |\n| 353 | massive/hu-HU                                                | AmazonScience/massive                       | hu-HU                          |             | amazon_intent           | Classification      |\n| 354 | massive/hi-IN                                                | AmazonScience/massive                       | hi-IN                          |             | amazon_intent           | Classification      |\n| 355 | massive/he-IL                                                | AmazonScience/massive                       | he-IL                          |             | amazon_intent           | Classification      |\n| 356 | massive/fr-FR                                                | AmazonScience/massive                       | fr-FR                          |             | amazon_intent           | Classification      |\n| 357 | massive/km-KH                                                | AmazonScience/massive                       | km-KH                          |             | amazon_intent           | Classification      |\n| 358 | massive/fi-FI                                                | AmazonScience/massive                       | fi-FI                          |             | amazon_intent           | Classification      |\n| 359 | massive/sl-SL                                                | AmazonScience/massive                       | sl-SL                          |             | amazon_intent           | Classification      |\n| 360 | massive/sv-SE                                                | AmazonScience/massive                       | sv-SE                          |             | amazon_intent           | Classification      |\n| 361 | massive/af-ZA                                                | AmazonScience/massive                       | af-ZA                          |             | amazon_intent           | Classification      |\n| 362 | massive/am-ET                                                | AmazonScience/massive                       | am-ET                          |             | amazon_intent           | Classification      |\n| 363 | massive/ar-SA                                                | AmazonScience/massive                       | ar-SA                          |             | amazon_intent           | Classification      |\n| 364 | massive/az-AZ                                                | AmazonScience/massive                       | az-AZ                          |             | amazon_intent           | Classification      |\n| 365 | massive/bn-BD                                                | AmazonScience/massive                       | bn-BD                          |             | amazon_intent           | Classification      |\n| 366 | massive/ca-ES                                                | AmazonScience/massive                       | ca-ES                          |             | amazon_intent           | Classification      |\n| 367 | massive/cy-GB                                                | AmazonScience/massive                       | cy-GB                          |             | amazon_intent           | Classification      |\n| 368 | massive/da-DK                                                | AmazonScience/massive                       | da-DK                          |             | amazon_intent           | Classification      |\n| 369 | massive/de-DE                                                | AmazonScience/massive                       | de-DE                          |             | amazon_intent           | Classification      |\n| 370 | massive/el-GR                                                | AmazonScience/massive                       | el-GR                          |             | amazon_intent           | Classification      |\n| 371 | massive/sq-AL                                                | AmazonScience/massive                       | sq-AL                          |             | amazon_intent           | Classification      |\n| 372 | massive/en-US                                                | AmazonScience/massive                       | en-US                          |             | amazon_intent           | Classification      |\n| 373 | massive/all                                                  | AmazonScience/massive                       | all                            |             | amazon_intent           | Classification      |\n| 374 | massive/zh-TW                                                | AmazonScience/massive                       | zh-TW                          |             | amazon_intent           | Classification      |\n| 375 | massive/zh-CN                                                | AmazonScience/massive                       | zh-CN                          |             | amazon_intent           | Classification      |\n| 376 | massive/vi-VN                                                | AmazonScience/massive                       | vi-VN                          |             | amazon_intent           | Classification      |\n| 377 | massive/ur-PK                                                | AmazonScience/massive                       | ur-PK                          |             | amazon_intent           | Classification      |\n| 378 | massive/tr-TR                                                | AmazonScience/massive                       | tr-TR                          |             | amazon_intent           | Classification      |\n| 379 | massive/tl-PH                                                | AmazonScience/massive                       | tl-PH                          |             | amazon_intent           | Classification      |\n| 380 | massive/th-TH                                                | AmazonScience/massive                       | th-TH                          |             | amazon_intent           | Classification      |\n| 381 | massive/te-IN                                                | AmazonScience/massive                       | te-IN                          |             | amazon_intent           | Classification      |\n| 382 | massive/ta-IN                                                | AmazonScience/massive                       | ta-IN                          |             | amazon_intent           | Classification      |\n| 383 | massive/sw-KE                                                | AmazonScience/massive                       | sw-KE                          |             | amazon_intent           | Classification      |\n| 384 | massive/all_1.1                                              | AmazonScience/massive                       | all_1.1                        |             | amazon_intent           | Classification      |\n| 385 | massive/fa-IR                                                | AmazonScience/massive                       | fa-IR                          |             | amazon_intent           | Classification      |\n| 386 | tydi-as2-balanced                                            | tasksource/tydi-as2-balanced                |                                |             | tidy_as2                | Classification      |\n| 387 | multiconer_v2/Hindi (HI)                                     | MultiCoNER/multiconer_v2                    | Hindi (HI)                     |             | multiconer              | TokenClassification |\n| 388 | multiconer_v2/Multilingual (MULTI)                           | MultiCoNER/multiconer_v2                    | Multilingual (MULTI)           |             | multiconer              | TokenClassification |\n| 389 | multiconer_v2/Ukrainian (UK)                                 | MultiCoNER/multiconer_v2                    | Ukrainian (UK)                 |             | multiconer              | TokenClassification |\n| 390 | multiconer_v2/Swedish (SV)                                   | MultiCoNER/multiconer_v2                    | Swedish (SV)                   |             | multiconer              | TokenClassification |\n| 391 | multiconer_v2/Spanish (ES)                                   | MultiCoNER/multiconer_v2                    | Spanish (ES)                   |             | multiconer              | TokenClassification |\n| 392 | multiconer_v2/Bangla (BN)                                    | MultiCoNER/multiconer_v2                    | Bangla (BN)                    |             | multiconer              | TokenClassification |\n| 393 | multiconer_v2/Chinese (ZH)                                   | MultiCoNER/multiconer_v2                    | Chinese (ZH)                   |             | multiconer              | TokenClassification |\n| 394 | multiconer_v2/English (EN)                                   | MultiCoNER/multiconer_v2                    | English (EN)                   |             | multiconer              | TokenClassification |\n| 395 | multiconer_v2/Farsi (FA)                                     | MultiCoNER/multiconer_v2                    | Farsi (FA)                     |             | multiconer              | TokenClassification |\n| 396 | multiconer_v2/Portuguese (PT)                                | MultiCoNER/multiconer_v2                    | Portuguese (PT)                |             | multiconer              | TokenClassification |\n| 397 | multiconer_v2/German (DE)                                    | MultiCoNER/multiconer_v2                    | German (DE)                    |             | multiconer              | TokenClassification |\n| 398 | multiconer_v2/Italian (IT)                                   | MultiCoNER/multiconer_v2                    | Italian (IT)                   |             | multiconer              | TokenClassification |\n| 399 | multiconer_v2/French (FR)                                    | MultiCoNER/multiconer_v2                    | French (FR)                    |             | multiconer              | TokenClassification |\n| 400 | mtop                                                         | tasksource/mtop                             |                                |             | mtop                    | Classification      |\n| 401 | multilingual-zero-shot-label-nli                             | tasksource/multilingual-zero-shot-label-nli |                                |             | mlabel_nli              | Classification      |\n"
  },
  {
    "path": "pyproject.toml",
    "content": "[build-system]\nrequires = [\"setuptools>=45\", \"setuptools_scm[toml]>=6.2\"]\nbuild-backend = \"setuptools.build_meta\"\n\n[tool.setuptools_scm]\n"
  },
  {
    "path": "setup.cfg",
    "content": " [metadata]\nname = tasksource\ndescription = Preprocessings to prepare datasets for a task\nlong_description = file: README.md\nlong_description_content_type = text/markdown\nurl = https://github.com/sileod/tasksource/\nclassifiers =\n    Programming Language :: Python :: 3\n    License :: OSI Approved :: BSD License\n    Intended Audience :: Developers\n\n[options]\npackage_dir =\n    = src\npackages = find:\npython_requires = >=3.6\ninstall_requires =\n    dotwiz\n    funcy\n    datasets\n    exrex\n    magicattr\n    pandas\n    numpy\n    scipy\n    sorcery\n\n[options.packages.find]\nwhere = src\n"
  },
  {
    "path": "src/tasksource/.ipynb_checkpoints/access-checkpoint.py",
    "content": "from .preprocess import Preprocessing\nimport re\nimport pandas as pd\nfrom . import tasks, recast\nfrom .metadata import dataset_rank\nfrom datasets import load_dataset\nimport funcy as fc\nimport os\nimport copy\nfrom sorcery import dict_of\nfrom functools import cache\nimport random\n\n\nclass lazy_mtasks:\n    def __getattr__(self, name):\n        from . import mtasks\n        return getattr(mtasks, name)\n\n    def __dir__(self):\n        from . import mtasks\n        return dir(mtasks)\nlmtasks=lazy_mtasks()\n\ndef parse_var_name(s):\n    config_name,task_name = None,None\n    if '__' in s and '___' not in s: # dataset__task\n        dataset_name, task_name = s.split('__') \n    elif '__' not in s.replace('___','') and '___' in s: #dataset___config\n        dataset_name, config_name = s.split('___') \n    elif  '___' in s and '__' in s.split('___')[1]: #dataset___config__task\n        dataset_name, config_task=s.split('___')\n        config_name,task_name = config_task.split('__')\n    else: # dataset \n        dataset_name = s\n    return dataset_name,config_name,task_name\n\ndef pretty_name(x):\n    dn = x.dataset_name.split(\"/\")[-1]   \n    cn = x.config_name if x.config_name else \"\"\n    tn = x.task_name if x.task_name else \"\"\n    return f\"{dn}/{cn}/{tn}\".replace('//','/').rstrip('/')\n\n@cache\ndef list_tasks(tasks_path=f'{os.path.dirname(__file__)}/tasks.py',multilingual=False,instruct=False, excluded=[]):\n    if multilingual:\n        tasks_path=tasks_path.replace('/tasks.py','/mtasks.py')\n    task_order = open(tasks_path).readlines()\n    task_order = [x.split('=')[0].rstrip() for x in task_order if '=' in x]\n    task_order = [x for x in task_order if x.isidentifier()]\n    task_order = fc.flip(dict(enumerate(task_order)))\n\n    l = []\n    _tasks = (lmtasks if multilingual else tasks)\n\n    for key in dir(_tasks):\n        if key not in task_order:\n            continue\n        value=getattr(_tasks, key)\n        if isinstance(value,Preprocessing):\n            dataset_name, config_name, task_name = parse_var_name(key)\n            dataset_name = (value.dataset_name if value.dataset_name else dataset_name)\n            config_name = (value.config_name if value.config_name else config_name)\n            hasattr(value,key)\n            l+=[{'dataset_name': dataset_name,\n                 'config_name' : config_name,\n                 'task_name': task_name,\n                 'preprocessing_name': key,\n                'task_type': value.__class__.__name__,'mapping': value,\n                'rank':task_order.get(key,None)}]   \n    df=pd.DataFrame(l).explode('config_name')\n    df = df.sort_values('rank').reset_index(drop=True)\n    df['id'] = df.apply(lambda x: pretty_name(x), axis=1)\n    df.insert(0, 'id', df.pop('id'))\n    del df['rank']\n    if instruct:\n        df=df[df.id.map(lambda x: not any(a in x for a in recast.improper_labels))]\n    df=df[df.id.map(lambda x: not any(x in a for a in excluded))]\n    return df\n\n#task_df =list_tasks()\n#mtask_df =list_tasks(multilingual=True)\n\ndef dict_to_query(d=dict(), **kwargs):\n    d={**d,**kwargs}\n    return '&'.join([f'`{k}`==\"{v}\"' for k,v in d.items()])\n\ndef load_preprocessing(tasks=tasks, **kwargs):\n    _tasks_df = list_tasks(multilingual=tasks==lmtasks)\n    y = _tasks_df.copy().query(dict_to_query(**kwargs)).iloc[0]\n    preprocessing= copy.copy(getattr(tasks, y.preprocessing_name))\n    for c in 'dataset_name','config_name':\n        if not isinstance(getattr(preprocessing,c), str):\n             setattr(preprocessing,c,getattr(y,c))\n    return preprocessing\n\ndef load_task(id=None, dataset_name=None,config_name=None,task_name=None,preprocessing_name=None,\n         max_rows=None, max_rows_eval=None, multilingual=False, instruct=False, seed=0, **load_dataset_kwargs):\n    query = dict_of(id, dataset_name, config_name, task_name,preprocessing_name)\n    query = {k:v for k,v in query.items() if v}\n    _tasks = (lmtasks if multilingual else tasks)\n    preprocessing = load_preprocessing(_tasks, **query)\n\n    if \"trust_remote_code\" not in load_dataset_kwargs:\n        load_dataset_kwargs[\"trust_remote_code\"] = True\n    \n    dataset = load_dataset(preprocessing.dataset_name, preprocessing.config_name, **load_dataset_kwargs)\n    dataset= preprocessing(dataset,max_rows, max_rows_eval)\n    dataset.task_type = preprocessing.__class__.__name__\n    if instruct:\n        dataset=recast.recast_instruct(dataset)\n    return dataset"
  },
  {
    "path": "src/tasksource/.ipynb_checkpoints/preprocess-checkpoint.py",
    "content": "from collections.abc import Iterable\nfrom dotwiz import DotWiz\nfrom dataclasses import dataclass\nfrom typing import Union\nimport itertools\nimport funcy as fc\nimport exrex \nimport magicattr \nimport numpy as np\nimport copy\nimport datasets\nimport time\n\nMAX_MC_OPTIONS = 4\n\ndef get_column_names(dataset):\n    cn = dataset.column_names\n    if type(cn)==dict:\n        return set(fc.flatten(cn.values()))\n    else:\n        return set(cn)\n\n\ndef sample_dataset(dataset,n=10000, n_eval=1000,seed=0):\n    for k in dataset:\n        n_k=(n if k=='train' else n_eval)\n        if n_k and len(dataset[k])>n_k:\n            dataset[k]=dataset[k].train_test_split(train_size=n_k,seed=seed)['train']\n    return dataset\n\nclass Preprocessing(DotWiz):\n    default_splits = ('train','validation','test')\n    _instances = []\n\n    def __post_init__(self):\n        Preprocessing._instances+=[self]\n\n    @staticmethod\n    def __map_to_target(x,fn=lambda x:None, target=None):\n        x[target]=fn(x)\n        return x\n        \n    def load(self):\n        return self(datasets.load_dataset(self.dataset_name,self.config_name))\n\n    def __call__(self,dataset, max_rows=None, max_rows_eval=None,seed=0):\n        dataset = self.pre_process(dataset)\n\n        # manage splits\n        for k,v in zip(self.default_splits, self.splits):\n            if v and k!=v:\n                dataset[k]=dataset[v]\n                del dataset[v]\n            if k in dataset and not v: # obfuscated label\n                del dataset[k]\n        dataset = fix_splits(dataset)\n\n        for k in list(dataset.keys()):\n            if k not in self.default_splits:\n                del dataset[k]\n        dataset = sample_dataset(dataset, max_rows, max_rows_eval,seed=seed)\n        \n        # field annotated with a string\n        substitutions = {v:k for k,v in self.to_dict().items()\n            if (k and k not in {'splits','dataset_name','config_name'} \n            and type(v)==str and k!=v)}\n\n        dataset=dataset.remove_columns([c for c in substitutions.values() if c in dataset['train'].features and c not in substitutions])\n        dataset=dataset.rename_columns(substitutions)\n\n        # field annotated with a function                                \n        for k in self.to_dict().keys():\n            v=getattr(self, k)\n            if callable(v) and k not in {\"post_process\",\"pre_process\",\"load\"}:\n                dataset=dataset.map(self.__map_to_target,\n                                    fn_kwargs={'fn':v,'target':k})\n\n        dataset=dataset.remove_columns(\n            get_column_names(dataset)-set(self.to_dict().keys()))\n        dataset = fix_labels(dataset)\n        dataset = fix_splits(dataset) # again: label mapping changed\n        dataset = self.post_process(dataset)\n        return dataset\n\n\n@dataclass\nclass cat(Preprocessing):\n    fields:Union[str,list]=None\n    separator:str=' '\n        \n    def __call__(self, example=None):\n        y=[np.char.array(example[f]) + sep \n                for f,sep in zip(self.fields[::-1],itertools.repeat(self.separator))]\n        y=list(sum(*y))\n        if len(y)==1:\n            y=y[0]\n        return y\n\n\ndef pretty(f):\n    class pretty_f(DotWiz):\n        def __init__(self,*args):\n            self.__f_arg = f(*args)\n            for a in args:\n                setattr(self,'value',a)\n                \n        def __call__(self, *args,**kwargs):\n            return self.__f_arg(*args,**kwargs)\n\n        def __repr__(self):\n            return f\"{self.__f_arg.__qualname__ .split('.')[0]}({self.value})\"\n    return pretty_f\n\nclass dotgetter:\n    def __init__(self, path=''):\n        self.path=path\n\n    def __bool__(self):\n        return bool(self.path)\n\n    def __getattr__(self, k):\n        return self.__class__(f'{self.path}.{k}'.lstrip('.'))\n    \n    def __getitem__(self, i):\n        return self.__class__(f'{self.path}[{i}]')\n\n    def __call__(self, example=None):\n        return magicattr.get(DotWiz(example), self.path)\n\n    def __hash__(self):\n        return hash(self.path)\n\n\n@dataclass\nclass ClassificationFields(Preprocessing):\n    sentence1:str='sentence1'\n    sentence2:str='sentence2'\n    labels:str='labels'\n\n@dataclass\nclass Seq2SeqLMFields(Preprocessing):\n    prompt:str='prompt'\n    output:str='output'\n\n@dataclass\nclass TokenClassificationFields(Preprocessing):\n    tokens:str='tokens'\n    labels:str='labels'\n        \n@dataclass\nclass MultipleChoiceFields(Preprocessing):\n    inputs:str='input'\n    choices:Iterable=tuple()\n    labels:str='labels'\n    choices_list:str=None\n    def __post_init__(self):\n        for i, c in enumerate(self.choices):\n            setattr(self,f'choice{i}',c)\n        delattr(self,'choices')\n        if not self.choices_list:\n            delattr(self,'choices_list')\n    \n    def __call__(self,dataset, *args, **kwargs):\n        dataset = super().__call__(dataset, *args, **kwargs)\n        if self.choices_list:\n            dataset = dataset.filter(lambda x: 1<len(x['choices_list']))\n            n_options = min([len(x) for k in dataset for x in dataset[k]['choices_list']])\n            n_options = min(MAX_MC_OPTIONS,n_options)\n            dataset = dataset.map(self.flatten_choice_list, fn_kwargs={'n_options':n_options})\n\n        else:\n            dataset = dataset.map(self.sample_choices, fn_kwargs={'n_options':MAX_MC_OPTIONS})\n        return dataset\n\n    @staticmethod\n    def flatten_choice_list(x, n_options=None):\n        n_neg = n_options-1 if n_options else None\n        choices = x['choices_list']\n        label=x['labels']\n        neg = choices[:label] + choices[label+1:]\n        pos = choices[label]\n        x['labels']=0\n        x['choices_list']=[pos]+neg[:n_neg]\n        for i,o in enumerate(x['choices_list']):\n            x[f'choice{i}']=o\n        del x['choices_list']\n        return x\n\n    @staticmethod\n    def sample_choices(x, n_options=None):\n        choices = [x[c] for c in x if 'choice' in c]\n        if not MAX_MC_OPTIONS or len(choices)<=n_options:\n            return x\n        n_neg = n_options-1 if n_options else None\n        label=x['labels']\n        neg = choices[:label] + choices[label+1:]\n        pos = choices[label]\n        x['labels']=0\n        choices_list=[pos]+neg[:n_neg]\n        for c in list(x):\n            if 'choice' in c:\n                del x[c]\n        for i,o in enumerate(choices_list):\n            x[f'choice{i}']=o\n        return x\n\n@dataclass\nclass SharedFields:\n    splits:list=Preprocessing.default_splits\n    dataset_name:str = None\n    config_name:str = None\n    pre_process: callable = fc.identity\n    post_process: callable = fc.identity\n    #language:str=\"en\"\n    \n\n@dataclass\nclass Classification(SharedFields, ClassificationFields): pass\n\n@dataclass\nclass MultipleChoice(SharedFields, MultipleChoiceFields): pass\n\n@dataclass\nclass TokenClassification(SharedFields, TokenClassificationFields): pass\n\n@dataclass\nclass Seq2SeqLM(SharedFields, Seq2SeqLMFields): pass\n\nget=dotgetter()\nconstant = pretty(fc.constantly)\nregen = lambda x: list(exrex.generate(x))\n\ndef name(label_name, classes):\n    return lambda x:classes[x[label_name]]\n\ndef fix_splits(dataset):\n\n    if len(dataset)==1 and \"train\" not in dataset:\n        k = list(dataset)[0]\n        dataset['train'] = copy.deepcopy(dataset[k])\n        del dataset[k]\n\n    if 'auxiliary_train' in dataset:\n        del dataset['auxiliary_train']\n    \n    if 'test' in dataset: # manage obfuscated labels\n        if 'labels' in dataset['test'].features:\n            if len(set(fc.flatten(dataset['test'].to_dict()['labels'])))==1:\n                del dataset['test']\n\n    if 'validation' in dataset and 'train' not in dataset:\n        train_validation = dataset['validation'].train_test_split(0.5, seed=0)\n        dataset['train'] = train_validation['train']\n        dataset['validation']=train_validation['test']\n    \n    if 'validation' in dataset and 'test' not in dataset:\n        validation_test = dataset['validation'].train_test_split(0.5, seed=0)\n        dataset['validation'] = validation_test['train']\n        dataset['test']=validation_test['test']\n\n    if 'train' in dataset and 'validation' not in dataset:\n        train_val = dataset['train'].train_test_split(train_size=0.90, seed=0)\n        dataset['train'] = train_val['train']\n        dataset['validation']=train_val['test']\n\n    if 'test' in dataset and 'validation' not in dataset:\n        validation_test = dataset['test'].train_test_split(0.5, seed=0)\n        dataset['validation'] = validation_test['train']\n        dataset['test']=validation_test['test']\n\n    if 'validation' not in dataset and 'test' not in dataset:\n        train_val_test = dataset[\"train\"].train_test_split(train_size=0.90, seed=0)\n        val_test = train_val_test[\"test\"].train_test_split(0.5, seed=0)\n        dataset[\"train\"] = train_val_test[\"train\"]\n        dataset[\"validation\"] = val_test[\"train\"]\n        dataset[\"test\"] = val_test[\"test\"]\n        \n    return dataset \n\ndef fix_labels(dataset, label_key='labels'):\n    if type(dataset['train'][label_key][0]) in [int,list,float]:\n        return dataset\n    labels=set(fc.flatten(dataset[k][label_key] for k in {\"train\"}))\n    if set(labels)=={'entailment','neutral','contradiction'}:\n        order=lambda x:dict(fc.flip(enumerate(['entailment','neutral','contradiction']))).get(x,x)\n    else:\n        order=str\n    labels=sorted(labels, key=order)\n    dataset=dataset.cast_column(label_key, datasets.ClassLabel(names=labels))\n    return dataset\n\ndef concatenate_dataset_dict(l):\n    \"\"\"Concatenate a list of DatastDict objects sharing same splits and columns.\"\"\"\n    keys=l[0].keys()\n    return datasets.DatasetDict({k: datasets.concatenate_datasets([x[k] for x in l]) for k in keys})"
  },
  {
    "path": "src/tasksource/.ipynb_checkpoints/recast-checkpoint.py",
    "content": "import random\nfrom datasets import DatasetDict, Dataset\nfrom sorcery import dict_of\nimport string\n\nimproper_labels =['recast/recast_kg_relations','linguisticprobing',\"lex_glue/scotus\",'lexical_relation_classification/ROOT09',\"pragmeval/squinky\",\"pragmeval/emobank\",'pragmeval/persuasiveness']\nimproper_labels += ['glue/stsb', 'sick/relatedness', 'joci', 'utilitarianism', 'amazon_counterfactual/en', 'toxic_conversations', 'ethos/multilabel', 'lex_glue/eurlex', 'lex_glue/unfair_tos', 'app_reviews', 'humicroedit/subtask-1', 'stackoverflow-questions', 'go_emotions/simplified', 'google_wellformed_query', 'has_part', 'blog_authorship_corpus/age', 'promptCoherence', 'Sarcasm_News_Headline', 'auditor_review/demo-org--auditor_review', 'Dynasent_Disagreement', 'Politeness_Disagreement', 'SBIC_Disagreement', 'SChem_Disagreement', 'Dilemmas_Disagreement', 'sts-companion', 'acceptability-prediction', 'chaos-mnli-ambiguity', 'headline_cause/en_simple', 'oasst1_dense_flat', 'civil_comments']\n\nimproper_labels += ['stsb_multi_mt','MLMA_hate_speech','icl-symbol-tuning-instruct','zero-shot-label-nli']\n\nimproper_labels += ['essay-scoring','english-grading','HelpSteer','oasst2']\n\ndef render_options(options):\n    options = [f'\"{x}\"' for x in options]\n    return f\"{', '.join(options[:-1])} or {options[-1]}\"\n\ndef render_classification(text,options,answer):\n    example = 'text_A→text_B' if text.startswith('text_A:') else 'the following'\n    inputs = f'With no explanation, label {example} with either {render_options(options)}.\\n{text}'\n    targets = f\"{answer}.\"\n    return dict_of(inputs,targets)\n\ndef render_token_classification(tokens,options,labels):\n    prefix = f'With no explanation, label each line with {render_options(options)} preceded by \":\".\\n'\n    inputs = prefix+\"\\n\".join(tokens)\n    targets = \"\\n\".join([':'.join(x) for x in zip(tokens,labels)])\n    return dict_of(inputs,targets)\n\ndef render_multiple_choice(prompt, options, labels):\n    inputs=(prompt+'\\n' if prompt else '')\n    letters = string.ascii_uppercase[:len(options)]\n    inputs=f'With no explanation, chose the best option from {render_options(letters)}. {inputs}'    \n    for letter, option in zip(letters, options):\n        inputs+=f'\\n{letter}: {option}'\n    targets = f'{letters[labels]}.'\n    return dict_of(inputs, targets) \n\ndef negative_sample_options(y, labels,N=4):\n    if len(labels)<N:\n        return labels\n    else:\n        return [y]+random.sample([x for x in labels if x!=y], N-1)\n\ndef shuffle_choices(x):\n    choices = sorted([k for k in x if 'choice' in k])\n    choices_texts = [x[c] for c in choices]\n    correct_choice =choices_texts[x['labels']]\n    random.shuffle(choices_texts)\n    for c, ct in zip(choices, choices_texts):\n        x[c]=ct\n    x[\"labels\"]=choices_texts.index(correct_choice)\n    return x\n\ndef recast_dataset_classification_to_mc(dataset,sep=\"[SEP]\",N=4):\n\n    def recast_split(d,N=N):\n        labels = d.features['labels']\n        df=d.to_pandas()\n        df['inputs'] = df.sentence1\n        if \"sentence2\" in df:\n            df['inputs'] +=sep + df.sentence2\n\n        N=min(N, len(labels.names))\n        df['choices']=df.apply(lambda x:negative_sample_options(labels.int2str(x['labels']), labels.names,N),axis=1)     \n        df['labels']=df.apply(lambda x:x['choices'].index(labels.int2str(x['labels'])),axis=1)\n\n        for i in range(N):\n            df[f'choice{i}']= \"This example is \" + df.choices.map(lambda x:x[i])\n\n        choices = [f'choice{i}' for i in range(N)]\n        return Dataset.from_pandas(df[['inputs',*choices,'labels']],preserve_index=False)\n\n    return DatasetDict({k: recast_split(v) for k,v in dataset.items()})\n\n\ndef recast_instruct(dataset):\n    features = dataset['train'].features\n    labels = features['labels']\n\n    if \"sentence1\" in features:\n        task_type='Classification'\n    if \"choice0\" in features:\n        task_type = \"MultipleChoice\"\n    if \"tokens\" in features:\n        task_type = \"TokenClassification\"\n\n    def recast_MultipleChoice(x):\n        x=shuffle_choices(x)\n        choices = sorted([k for k in x if 'choice' in k])\n        if all([x[c] in x['inputs'] for c in choices]):\n            return {\"inputs\":x['inputs'], 'targets': x[f\"choice{x['labels']}\"].strip()+\".\"}\n        else:\n            return render_multiple_choice(x['inputs'],[x[c] for c in choices],x['labels'])\n\n    def recast_TokenClassification(x):\n        distractors = list(labels.feature.names)\n        x_labels = [labels.feature.int2str(y) for y in x['labels']]\n        labels_set= list({labels.feature.int2str(y) for y in x['labels']})\n        options=list(dict.fromkeys(labels_set+distractors))[:max(len(labels_set),10)]\n        return render_token_classification(x['tokens'],options,x_labels)\n\n    def recast_Classification(x):\n        if 'sentence2' in x:\n            text=f\"text_A: {x['sentence1']}\\ntext_B: {x['sentence2']}\"\n        else:\n            text=x['sentence1']\n            \n        answer=labels.int2str(x['labels']).strip()\n        options= negative_sample_options(answer, labels._int2str)\n        return render_classification(text, options, answer)\n        \n    dataset = dataset.map(eval(f\"recast_{task_type}\"))\n    dataset = dataset.remove_columns([k for k in features if k not in ['inputs','targets']])\n    return dataset\n "
  },
  {
    "path": "src/tasksource/.ipynb_checkpoints/tasks-checkpoint.py",
    "content": "from .preprocess import cat, get, regen, name, constant, Classification, TokenClassification, MultipleChoice\nfrom .metadata import bigbench_discriminative_english, blimp_hard, imppres_presupposition, imppres_implicature, udep_en_configs, udep_en_labels\nfrom datasets import get_dataset_config_names, Sequence, ClassLabel, Dataset, DatasetDict\n\n# variable name: dataset___config__task\n\n###################### NLI/paraphrase ###############################\n\nglue___mnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"train\", None, \"validation_matched\"])\nglue___qnli = Classification(\"question\",\"sentence\", labels=\"label\")\nglue___rte = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\nglue___wnli = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\n#glue___ax = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"test\", None, None]) # fully masked\n\nglue___mrpc = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\nglue___qqp = Classification(sentence1=\"question1\", sentence2=\"question2\", labels=\"label\")\nglue___stsb = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\n\nsuper_glue___boolq = Classification(sentence1=\"question\", labels=\"label\")\nsuper_glue___cb = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\")\nsuper_glue___multirc = Classification(\n    cat([\"paragraph\", \"question\"]),\n    'answer',\n    labels='label'\n)\n#super_glue___rte = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\") # in glue\nsuper_glue___wic = Classification(\n    sentence1=cat([\"word\",\"sentence1\"], \" : \"),\n    sentence2=cat([\"word\",\"sentence2\"], \" : \"),\n    labels='label'\n)\nsuper_glue___axg = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"test\", None, None])\n\n\nanli__a1 = Classification('premise','hypothesis','label', splits=['train_r1','dev_r1','test_r1'])\nanli__a2 = Classification('premise','hypothesis','label', splits=['train_r2','dev_r2','test_r2'])\nanli__a3 = Classification('premise','hypothesis','label', splits=['train_r3','dev_r3','test_r3'])\n\n\nbabi_nli = Classification(\"premise\", \"hypothesis\", \"label\",\n    dataset_name=\"tasksource/babi_nli\",\n    config_name=set(get_dataset_config_names(\"tasksource/babi_nli\"))-{\"agents-motivations\"}\n) # agents-motivations task is not as clear-cut as the others\n\n\nsick__label         = Classification('sentence_A','sentence_B','label')\nsick__relatedness   = Classification('sentence_A','sentence_B','relatedness_score')\nsick__entailment_AB = Classification('sentence_A','sentence_B','entailment_AB')\n#sick__entailment_BA = Classification('sentence_A','sentence_B','entailment_BA')\n\ndef remove_neg_1(dataset):\n    return dataset.filter(lambda x:x['labels']!=-1)\n\nsnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\",\n    post_process=remove_neg_1)\n\nscitail = Classification(\"sentence1\",\"sentence2\",\"gold_label\",config_name=\"snli_format\")\n\nhans = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\")\n\nwanli = Classification('premise','hypothesis','gold', dataset_name=\"alisawuffles/WANLI\")\n\nrecast_nli = Classification(sentence1=\"context\", sentence2=\"hypothesis\", labels=\"label\", dataset_name=\"tasksource/recast\",\n    config_name=['recast_kg_relations', 'recast_puns', 'recast_factuality', 'recast_verbnet',\n    'recast_verbcorner', 'recast_ner', 'recast_sentiment', 'recast_megaveridicality'])\n\n\nprobability_words_nli = Classification(sentence1=\"context\", sentence2=\"hypothesis\", labels=\"label\",\n    dataset_name=\"sileod/probability_words_nli\", \n    config_name=[\"reasoning_1hop\",\"reasoning_2hop\",\"usnli\"])\n\nnan_nli = Classification(\"premise\", \"hypothesis\", \"label\", dataset_name=\"joey234/nan-nli\")\n\nnli_fever = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/nli_fever\", splits=[\"train\",\"dev\",None])\n\nbreaking_nli = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"pietrolesci/breaking_nli\", splits=[\"full\",None,None])\n\nconj_nli = Classification(\"premise\",\"hypothesis\",\"label\",post_process=remove_neg_1,\n    dataset_name=\"pietrolesci/conj_nli\",splits=['train','dev',None])\n\nfracas = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/fracas\")\n\ndialogue_nli = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"pietrolesci/dialogue_nli\")   \n\nmpe_nli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/mpe\",\n    splits=[\"train\",\"dev\",\"test\"])  \n\ndnc_nli = Classification(\"context\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/dnc\")\n\n# gpt3_nli = Classification(\"text_a\",\"text_b\",\"label\",dataset_name=\"pietrolesci/gpt3_nli\") # not sound enough\n\nrecast_white__fnplus = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['fnplus',None,None])\nrecast_white__sprl = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['sprl',None,None])\nrecast_white__dpr = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['dpr',None,None])\n\njoci = Classification(\"context\",\"hypothesis\",\n    labels=lambda x: [None, \"impossible\", \"technically possible\", \"plausible\", \"likely\", \"very likely\"][x[\"original_label\"]],\n    pre_process=lambda ds:ds.filter(lambda x:x['original_label']!=0),\n    dataset_name=\"pietrolesci/joci\",splits=['full',None,None])\n\n#enfever_nli = Classification(\"evidence\",\"claim\",\"label\", dataset_name=\"ctu-aic/enfever_nli\")\n\nrobust_nli__IS_CS = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"IS_CS\",None,None])\nrobust_nli__LI_LI = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"LI_LI\",None,None])\nrobust_nli__ST_WO = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_WO\",None,None])\nrobust_nli__PI_SP = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"PI_SP\",None,None])\nrobust_nli__PI_CD = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"PI_CD\",None,None])\nrobust_nli__ST_SE = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_SE\",None,None])\nrobust_nli__ST_NE = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_NE\",None,None])\nrobust_nli__ST_LM = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_LM\",None,None])\nrobust_nli_is_sd = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/robust_nli_is_sd\")\nrobust_nli_li_ts = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/robust_nli_li_ts\")\n\ngen_debiased_nli__snli_seq_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_seq_z\",None,None])\ngen_debiased_nli__snli_z_aug = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_z_aug\",None,None])\ngen_debiased_nli__snli_par_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_par_z\",None,None])\ngen_debiased_nli__mnli_par_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_par_z\",None,None])\ngen_debiased_nli__mnli_z_aug = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_z_aug\",None,None])\ngen_debiased_nli__mnli_seq_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_seq_z\",None,None])\n\nadd_one_rte = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/add_one_rte\",splits=[\"train\",\"dev\",\"test\"])\n\ndef _imppres_post_process(ds,prefix=''):\n    # imppres entailment definition is either purely semantic or purely pragmatic\n    # because of that, we assign differentiate the labels from anli/mnli notation\n    return ds.cast_column('labels', ClassLabel(\n    names=[f'{prefix}_entailment',f'{prefix}_neutral',f'{prefix}_contradiction']))\n\nimppres__presupposition = imppres__prag = Classification(\"premise\",\"hypothesis\",\"gold_label\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_presupposition,\n    post_process=_imppres_post_process)\n\nimppres__prag = Classification(\"premise\",\"hypothesis\",\"gold_label_prag\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_implicature,\n    post_process=lambda x: _imppres_post_process(x,'pragmatic'))\n\nimppres__log = Classification(\"premise\",\"hypothesis\",\"gold_label_log\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_implicature,\n    post_process=lambda x: _imppres_post_process(x,'logical'))\n\n\n#glue__diagnostics = Classification(\"premise\",\"hypothesis\",\"label\",\n#    dataset_name=\"pietrolesci/glue_diagnostics\",splits=[\"test\",None,None])\n\nhlgd = Classification(\"headline_a\", \"headline_b\", labels=\"label\")\n\npaws___labeled_final   = Classification(\"sentence1\", \"sentence2\", name('label',['not_paraphrase','paraphrase']))\npaws___labeled_swap    = Classification(\"sentence1\", \"sentence2\", name('label',['not_paraphrase','paraphrase']), splits=[\"train\", None, None])\n#paws___unlabeled_final = Classification(\"sentence1\", \"sentence2\", \"label\")\n\n#quora = Classification(get.questions.text[0], get.questions.text[1], 'is_duplicate') # in glue\nmedical_questions_pairs = Classification(\"question_1\",\"question_2\", name(\"label\",['not similar','similar']))\n \n###################### Token Classification #########################\n\nconll2003__pos_tags   = TokenClassification(tokens=\"tokens\", labels='pos_tags')\nconll2003__chunk_tags = TokenClassification(tokens=\"tokens\", labels='chunk_tags')\nconll2003__ner_tags   = TokenClassification(tokens=\"tokens\", labels='ner_tags')\n\n#tner___tweebank_ner    = TokenClassification(tokens=\"tokens\", labels=\"tags\")\n\n######################## Multiple choice ###########################\n\n\nmodel_written_evals = MultipleChoice('question', choices=['answer_matching_behavior','answer_not_matching_behavior'], labels=constant(0),  \n    dataset_name=\"Anthropic/model-written-evals\")\n\ntruthful_qa___multiple_choice = MultipleChoice(\n    \"question\",\n    choices_list=get.mc1_targets.choices,\n    labels=constant(0)\n)\n\nfig_qa = MultipleChoice(\n    \"startphrase\",\n    choices=[\"ending1\",\"ending2\"],\n    labels=\"labels\",\n    dataset_name=\"nightingal3/fig-qa\",\n    splits=[\"train\",\"validation\",None]\n)\n\nbigbench = MultipleChoice(\n    'inputs',\n    choices_list='multiple_choice_targets',\n    labels=lambda x:x['multiple_choice_scores'].index(1) if 1 in ['multiple_choice_scores'] else -1,\n    dataset_name='tasksource/bigbench',\n    config_name=bigbench_discriminative_english - {\"social_i_qa\",\"intersect_geometry\"} # english multiple choice tasks, minus duplicates\n)\n#\"goal_step_wikihow\"\n\nblimp_hard = MultipleChoice(inputs=constant(''),\n    choices=['sentence_good','sentence_bad'],\n    labels=constant(0),\n    dataset_name=\"blimp\",\n    config_name=blimp_hard # tasks where GPT2 is at least 10% below  human accuracy\n)\n\ncos_e = MultipleChoice('question',\n    choices_list='choices',\n    labels= lambda x: x['choices_list'].index(x['answer']),\n    config_name='v1.0')\n\ncosmos_qa = MultipleChoice(cat(['context','question']),regen('answer[0-3]'),'label')\n\ndream = MultipleChoice(\n    lambda x:\"\\n\".join(x['dialogue']+[x['question']]),\n    choices_list='choice',\n    labels=lambda x:x['choices_list'].index(x['answer'])\n)\n\nopenbookqa = MultipleChoice(\n    'question_stem',\n    choices_list=get.choices.text,\n    labels='answerKey'\n)\n\nqasc = MultipleChoice(\n    'question',\n    choices_list=get.choices.text,\n    labels=lambda x: \"ABCDEFGH\".index(x['answerKey']),\n    splits=['train','validation',None]\n    \n)\n\nquartz = MultipleChoice(\n    'question',\n    choices_list=get.choices.text,\n    labels='answerKey'\n)\nquail = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',\n    labels='correct_answer_id' \n)\n\nhead_qa___en = MultipleChoice(\"qtext\",\n    choices_list = lambda x:[a['atext'] for a in x[\"answers\"]],\n    labels = lambda x:[a['aid'] for a in x[\"answers\"]].index(x[\"ra\"])\n)\n\n\nsciq = MultipleChoice(\n    'question',\n    ['correct_answer']+regen('distractor[1-3]'),\n    labels=constant(0))\n\nsocial_i_qa = MultipleChoice(\n    'question',\n    ['answerA','answerB','answerC'],\n    'label')\n\nwiki_hop___original = MultipleChoice(\n    'question', \n    choices_list='candidates',\n    labels=lambda x:x['choices_list'].index(x[\"answer\"]))\n\nwiqa = MultipleChoice('question_stem',\n    choices_list = lambda x: x['choices']['text'],\n    labels='answer_label_as_choice')\n\npiqa = MultipleChoice('goal', choices=['sol1','sol2'], labels='label')\n\nhellaswag = MultipleChoice('ctx_a',\n    choices_list=lambda x: [f'{x[\"ctx_b\"]}{e}' for e in x[\"endings\"]],\n    labels='label', splits=['train','validation',None])\n\nsuper_glue___copa = MultipleChoice('premise',['choice1','choice2'],'label')\n\nbalanced_copa = MultipleChoice('premise',['choice1','choice2'],'label',\n    dataset_name=\"pkavumba/balanced-copa\")\n\ne_care = MultipleChoice('premise',['choice1','choice2'],'label',\n    dataset_name=\"12ml/e-CARE\")\n\nart = MultipleChoice(cat(['hypothesis_1','hypothesis_2']),\n    ['observation_1','observation_2'],\n    labels=lambda x:x['label']-1,\n    splits=['train','validation',None]\n)\n\n\nmmlu = MultipleChoice('question',labels='answer',choices_list='choices',splits=['validation','dev','test'],\n    dataset_name=\"tasksource/mmlu\",\n    config_name=get_dataset_config_names(\"tasksource/mmlu\")\n)\n\nwinogrande = MultipleChoice('sentence',['option1','option2'],'answer',config_name='winogrande_xl',\n    splits=['train','validation',None])\n\ncodah = MultipleChoice('question_propmt',choices_list='candidate_answers',labels='correct_answer_idx',config_name='codah')\n\nai2_arc__challenge = MultipleChoice('question',\n    choices_list=get.choices.text,  \n    labels=lambda x: get.choices.label(x).index(x[\"answerKey\"]),\n    config_name=[\"ARC-Challenge\",\"ARC-Easy\"])\n\ndefinite_pronoun_resolution = MultipleChoice(\n    inputs=cat([\"sentence\",\"pronoun\"],' : '),\n    choices_list='candidates',\n    labels=\"label\",\n    splits=['train',None,'test'])\n\nswag___regular=MultipleChoice(cat([\"sent1\",\"sent2\"]),regen(\"ending[0-3]\"),\"label\")\n\ndef _split_choices(s):\n    import re\n    return [x.rstrip(', ') for x in re.split(r'[a-e] \\) (.*?)',s) if x.strip(', ')]\n\nmath_qa = MultipleChoice(\n    'Problem', \n    choices_list = lambda x: _split_choices(x['options']),\n    labels = lambda x:'abcde'.index(x['correct'])   \n)\n\n#aqua_rat___tokenized = MultipleChoice(\"question\",choices_list=\"options\",labels=lambda x:\"ABCDE\".index(x['correct'])) in math_qa\n\n\n######################## Classification (other) ########################\nglue___cola = Classification(sentence1=\"sentence\", labels=\"label\")\nglue___sst2 = Classification(sentence1=\"sentence\", labels=\"label\")\n\nutilitarianism = Classification(\"comparison\",labels=\"label\",\ndataset_name=\"metaeval/utilitarianism\")\n\namazon_counterfactual = Classification(\n    \"text\", labels=\"label\",\n    dataset_name=\"mteb/amazon_counterfactual\",\n    config_name=\"en\")\n\ninsincere_questions = Classification(\n    \"text\", labels=\"label_text\",\n    dataset_name=\"SetFit/insincere-questions\")\n\ntoxic_conversations = Classification(\n    \"text\", labels=\"label\",\n    dataset_name=\"SetFit/toxic_conversations\")\n\nturingbench = Classification(\"Generation\",labels=\"label\",\n    dataset_name=\"turingbench/TuringBench\",\n    splits=[\"train\",\"validation\",None])\n\n\ntrec = Classification(sentence1=\"text\", labels=\"fine_label\")\n\ntals_vitaminc = Classification('claim','evidence','label', dataset_name=\"tals/vitaminc\")\n\nhope_edi = Classification(\"text\", labels=\"label\", splits=[\"train\", \"validation\", None], config_name=[\"english\"])\n\n#fever___v1_0 = Classification(sentence1=\"claim\", labels=\"label\", splits=[\"train\", \"paper_dev\", \"paper_test\"], dataset_name=\"fever\", config_name=\"v1.0\")\n#fever___v2_0 = Classification(sentence1=\"claim\", labels=\"label\", splits=[None, \"validation\", None], dataset_name=\"fever\", config_name=\"v2.0\")\n\nrumoureval_2019 = Classification(\n    sentence1=\"source_text\",\n    sentence2=lambda x: str(x[\"reply_text\"]),\n    labels=\"label\", dataset_name=\"strombergnlp/rumoureval_2019\", config_name=\"RumourEval2019\",\n    post_process=lambda ds:ds.filter(lambda x:x['labels']!=None)    \n)\n\nethos___binary = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\nethos___multilabel = Classification(\n    'text',\n    labels=lambda x: [x[c] for c in\n    ['violence', 'gender', 'race', 'national_origin', 'disability', 'religion', 'sexual_orientation','directed_vs_generalized']\n    ],\n    splits=[\"train\", None, None]\n)\n\ntweet_eval = Classification(sentence1=\"text\", labels=\"label\",\n    config_name=[\"emoji\", \"emotion\", \"hate\", \"irony\", \"offensive\", \"sentiment\"])\n\ndef stance_kwargs(topic):\n    return {\n        \"sentence1\": constant(f'Topic: {topic}. \\n Opinion:\\n'), \n        \"sentence2\": \"text\", \n        \"labels\": \"label\", \n        \"config_name\": f\"stance_{topic.lower()}\",\n        \"dataset_name\": \"tweet_eval\"\n    }\n\ntweet_eval_abortion = Classification(**stance_kwargs(\"abortion\"))\ntweet_eval_atheism  = Classification(**stance_kwargs(\"atheism\"))\ntweet_eval_climate  = Classification(**stance_kwargs(\"climate\"))\ntweet_eval_feminist = Classification(**stance_kwargs(\"feminist\"))\ntweet_eval_hillary  = Classification(**stance_kwargs(\"Hillary\"))\n\n\ndiscovery = Classification(\"sentence1\", \"sentence2\", labels=\"label\", config_name=[\"discovery\"])\n\npragmeval_1 = Classification(\"sentence\",labels=\"label\",\n    dataset_name=\"pragmeval\",\n    config_name= [\"emobank-arousal\", \"emobank-dominance\", \"emobank-valence\", \"squinky-formality\", \"squinky-implicature\", \n    \"squinky-informativeness\",\"switchboard\",\"mrda\",\"verifiability\"])\n\npragmeval_2 = Classification(\"sentence1\",\"sentence2\",labels=\"label\",\n    dataset_name=\"pragmeval\",\n    config_name= [\"emergent\", \"gum\", \"pdtb\", \"persuasiveness-claimtype\", \n    \"persuasiveness-eloquence\", \"persuasiveness-premisetype\", \"persuasiveness-relevance\", \"persuasiveness-specificity\", \n    \"persuasiveness-strength\", \"sarcasm\",\"stac\"])\n\nsilicone = Classification(\"Utterance\",labels=\"Label\",\n    config_name=['dyda_da', 'dyda_e', 'iemocap', 'maptask', 'meld_e', 'meld_s', 'oasis', 'sem'] # +['swda', 'mrda'] # in pragmeval\n)\n\nlex_glue___eurlex = Classification(sentence1=\"text\", labels=\"labels\") \nlex_glue___scotus = Classification(sentence1=\"text\", labels=\"label\")\nlex_glue___ledgar = Classification(sentence1=\"text\", labels=\"label\")\nlex_glue___unfair_tos = Classification(sentence1=\"text\", labels=\"labels\")\nlex_glue___case_hold = MultipleChoice(\"context\", choices_list='endings', labels=\"label\")\n\nlanguage_identification = Classification(\"text\",labels=\"labels\", dataset_name=\"papluca/language-identification\")\n\n################ Automatically generated (verified)##########\n\nimdb = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nrotten_tomatoes = Classification(sentence1=\"text\", labels=\"label\")\n\nag_news = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nyelp_review_full = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"yelp_review_full\"])\n\nfinancial_phrasebank = Classification(sentence1=\"sentence\", labels=\"label\", splits=[\"train\", None, None],\n    config_name=[\"sentences_allagree\"])\n\npoem_sentiment = Classification(sentence1=\"verse_text\", labels=\"label\")\n\n#emotion = Classification(sentence1=\"text\", labels=\"label\") # file not found\n\ndbpedia_14 = Classification(sentence1=\"content\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"dbpedia_14\"])\n\namazon_polarity = Classification(sentence1=\"content\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"amazon_polarity\"])\n\napp_reviews = Classification(\"review\", labels=\"star\", splits=[\"train\", None, None])\n\n# multi_nli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"train\", \"validation_matched\", None]) #glue\n\nhate_speech18 = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\n\nsms_spam = Classification(sentence1=\"sms\", labels=\"label\", splits=[\"train\", None, None])\n\nhumicroedit___subtask_1 = Classification(\"original\", \"edit\", labels=\"meanGrade\", dataset_name=\"humicroedit\", config_name=\"subtask-1\")\nhumicroedit___subtask_2 = Classification(\n    sentence1=cat(['original1','edit1'],' : '),\n    sentence2=cat(['original2','edit2'],' : '),\n    labels=\"label\", dataset_name=\"humicroedit\", config_name=\"subtask-2\")\n\nsnips_built_in_intents = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\n\nbanking77 = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nhate_speech_offensive = Classification(sentence1=\"tweet\", labels=\"class\", splits=[\"train\", None, None])\n\nyahoo_answers_topics = Classification(\n    \"question_title\",\"question_content\",labels=\"topic\")\n\nstackoverflow_questions=Classification(\"title\",\"body\",labels=\"label\",\n    dataset_name=\"pacovaldez/stackoverflow-questions\")\n\n#hyperpartisan_news_detection___byarticle = Classification(sentence1=\"text\", labels=\"hyperpartisan\", splits=[\"train\", None, None]) # files too heavy\n#hyperpartisan_news_detection___bypublisher = Classification(sentence1=\"text\", labels=\"hyperpartisan\", splits=[\"train\",\"validation\", None]) # files too heavy\n\nhyperpartisan_news = Classification(\n    \"text\",\n    labels=lambda x: {'true':'hyperpartisan','false':'not_hyperpartisan'}.get(x[\"label\"]),\n    dataset_name=\"zapsdcn/hyperpartisan_news\")\n\nscierc = Classification(\"text\",labels=\"label\",dataset_name=\"zapsdcn/sciie\")\ncitation_intent = Classification(\"text\",labels=\"label\",dataset_name=\"zapsdcn/citation_intent\")\n\n#go_emotions___raw = Classification(sentence1=\"text\", splits=[\"train\", None, None])\ngo_emotions___simplified = Classification(sentence1=\"text\", labels=\"labels\")\n\n#boolq = Classification(sentence1=\"question\", splits=[\"train\", \"validation\", None]) # in superglue\n\n#ecthr_cases___alleged_violation_prediction = Classification(labels=\"labels\", dataset_name=\"ecthr_cases\", config_name=\"alleged-violation-prediction\")\n#ecthr_cases___violation_prediction = Classification(labels=\"labels\", dataset_name=\"ecthr_cases\", config_name=\"violation-prediction\")\n#   too long\n\nscicite = Classification(sentence1=\"string\", labels=\"label\",dataset_name=\"allenai/scicite\")\n\nliar = Classification(sentence1=\"statement\", labels=\"label\")\n\nrelbert_lexical_relation_classification = Classification(sentence1=\"head\", sentence2=\"tail\", labels=\"relation\",\n dataset_name=\"relbert/lexical_relation_classification\",\n config_name=[\"BLESS\",\"CogALexV\",\"EVALution\",\"K&H+N\",\"ROOT09\"])\n\n\nlinguisticprobing = Classification(\"sentence\", labels=\"label\", dataset_name=\"tasksource/linguisticprobing\", \n    config_name=['subj_number',\n                'obj_number',\n                'past_present',\n                'sentence_length',\n                'top_constituents',\n                'tree_depth',\n                'coordination_inversion',\n                'odd_man_out',\n                'bigram_shift']#+['word_content'] #too many labels \n)\n\ncrowdflower = Classification(\"text\", labels=\"label\",\n splits=[\"train\", None, None], dataset_name=\"tasksource/crowdflower\",\n config_name=['sentiment_nuclear_power',\n            'tweet_global_warming',\n            'airline-sentiment',\n            'corporate-messaging',\n            'economic-news',\n            'political-media-audience',\n            'political-media-bias',\n            'political-media-message',\n            'text_emotion']\n)\n\nethics___commonsense = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"commonsense\")\nethics___deontology = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"deontology\")\nethics___justice = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"justice\")\nethics___virtue = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"virtue\")\n\nemo = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"emo2019\"])\n\ngoogle_wellformed_query = Classification(sentence1=\"content\", labels=\"rating\")\n\ntweets_hate_speech_detection = Classification(sentence1=\"tweet\", labels=\"label\", splits=[\"train\", None, None])\n\n#adv_glue___adv_sst2 = Classification(sentence1=\"sentence\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_qqp = Classification(sentence1=\"question1\", sentence2=\"question2\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_mnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_mnli_mismatched = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_qnli = Classification(sentence1=\"question\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_rte = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\", splits=[\"validation\", None, None])\n\nhas_part = Classification(\"arg1\",\"arg2\", labels=\"score\", splits=[\"train\", None, None])\n\nwnut_17 = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"wnut_17\"])\n\nncbi_disease = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"ncbi_disease\"])\n\nacronym_identification = TokenClassification(labels=\"labels\", tokens=\"tokens\")\n\njnlpba = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", splits=[\"train\", \"validation\", None], config_name=[\"jnlpba\"])\n\n#species_800 = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"species_800\"]) missing files\n\nSpeedOfMagic_ontonotes_english = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", dataset_name=\"SpeedOfMagic/ontonotes_english\", config_name=\"SpeedOfMagic--ontonotes_english\")\n\nblog_authorship_corpus__gender    = Classification(sentence1=\"text\",labels=\"gender\")\nblog_authorship_corpus__age       = Classification(sentence1=\"text\",labels=\"age\")\n#blog_authorship_corpus__horoscope = Classification(sentence1=\"text\",labels=\"horoscope\")\nblog_authorship_corpus__job       = Classification(sentence1=\"text\",labels=\"job\")\n\nlaunch_open_question_type = Classification(sentence1=\"question\", labels=\"resolve_type\", dataset_name=\"launch/open_question_type\")\n\nhealth_fact = Classification(sentence1=\"claim\", labels=\"label\",\n    pre_process = lambda ds:ds.filter(lambda x:x['label'] not in {-1})\n)\n\ncommonsense_qa = MultipleChoice(\n    \"question\",\n    choices_list=get.choices.text,\n    labels=lambda x: \"ABCDE\".index(x[\"answerKey\"]),\n    splits=[\"train\",\"validation\",None]\n)\nmc_taco = Classification(\n    lambda x: f'{x[\"sentence\"]} {x[\"question\"]} {x[\"answer\"]}',\n    labels=\"label\",\n    splits=[ \"validation\",None,\"test\"]\n)\n\nade_corpus_v2___Ade_corpus_v2_classification = Classification(\"text\",labels=\"label\")\n\ndiscosense = MultipleChoice(\"context\",choices=regen(\"option\\_[0-3]\"),labels=\"label\",\n    dataset_name=\"prajjwal1/discosense\")\n    \ncirca = Classification(\n    sentence1=cat([\"context\",\"question-X\"]),\n    sentence2=\"answer-Y\",\n    labels=\"goldstandard2\", post_process=remove_neg_1)\n\n#code_x_glue_cc_defect_detection = Classification(\"func\", labels=\"target\")\n\n#code_x_glue_cc_clone_detection_big_clone_bench = Classification(\"func1\", \"func2\", \"label\") # in bigbench + too heavy (100g)\n\n#code_x_glue_cc_code_refinement = MultipleChoice(\n#    constant(\"\"), choices=[\"buggy\",\"fixed\"], labels=constant(0),\n#    config_name=\"medium\")\n\n#effective_feedback_student_writing = Classification(\"discourse_text\", \n#labels=\"discourse_effectiveness\",dataset_name=\"YaHi/EffectiveFeedbackStudentWriting\")\n# discontinued /!\\\n\n#promptSentiment = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptSentiment\")\n#promptNLI = Classification(\"premise\",\"hypothesis\",labels=\"label\",dataset_name=\"Ericwang/promptNLI\")\n#promptSpoke = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptSpoke\")\n#promptProficiency = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptProficiency\")\n#promptGrammar = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptGrammar\")\n#promptCoherence = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptCoherence\")\n\nphrase_similarity = Classification(\n    sentence1=cat([\"phrase1\",\"sentence1\"], \" : \"),\n    sentence2=cat([\"phrase2\",\"sentence2\"], \" : \"),\n    labels='label',\n    dataset_name=\"PiC/phrase_similarity\"\n)\n\nexaggeration_detection = Classification(\n    sentence1=\"press_release_conclusion\",\n    sentence2=\"abstract_conclusion\",\n    labels=\"exaggeration_label\", \n    dataset_name=\"copenlu/scientific-exaggeration-detection\"\n)\nquarel = Classification(\n    \"question\",\n    labels=lambda x: \"AB\"[x[\"answer_index\"]]\n)\n\nmwong_fever_evidence_related = Classification(sentence1=\"claim\", sentence2=\"evidence\", labels=name(\"labels\",['unrelated','related']),\n    splits=[\"train\", \"valid\", \"test\"], dataset_name=\"mwong/fever-evidence-related\")\n\nnumer_sense = Classification(\"sentence\",labels=\"target\",splits=[\"train\",None,None])\n\ndynasent__r1 = Classification(\"sentence\", labels=\"gold_label\", \n    dataset_name=\"dynabench/dynasent\", config_name=\"dynabench.dynasent.r1.all\")\ndynasent__r2 = Classification(\"sentence\", labels=\"gold_label\", \n    dataset_name=\"dynabench/dynasent\", config_name=\"dynabench.dynasent.r2.all\")\n\nsarcasm_news = Classification(\"headline\", labels=\"is_sarcastic\",\n    dataset_name=\"raquiba/Sarcasm_News_Headline\")\n\nsem_eval_2010_task_8 = Classification(\"sentence\",labels=\"relation\")\n\nauditor_review = Classification(sentence1=\"sentence\",\n    labels=name(\"label\",['negative','neutral','positive']),\n    dataset_name=\"demo-org/auditor_review\")\n\nmedmcqa = MultipleChoice(\"question\", choices=regen('op[a-d]'),labels='cop')\n\n\ndynasent_disagreement    = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Dynasent_Disagreement\")\npoliteness_disagreement  = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Politeness_Disagreement\")\nsbic_disagreement        = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/SBIC_Disagreement\")\nschem_disagreement       = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/SChem_Disagreement\")\ndilemmas_disagreement    = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Dilemmas_Disagreement\")\n\nlogiqa = MultipleChoice(\n    cat([\"context\",\"query\"]),\n    choices_list = 'options',\n    labels = \"correct_option\",\n    dataset_name=\"lucasmccabe/logiqa\"\n)\n\n#proto_qa = MultipleChoice(\n#    \"question\",\n#    choices_list=lambda x:x['answer-clusters']['answers'],\n#    labels=lambda x: x['answer-clusters']['count'].index(max(x['answer-clusters']['count'])),\n#    config_name='proto_qa'\n#)\n\nwiki_qa = Classification(\"question\",\"answer\", name(\"label\",['False','True']))\n\ncycic_classification = Classification(\"question\",labels=name(\"correct_answer\",['False','True']),\n    dataset_name = \"tasksource/cycic_classification\")\ncycic_mc = MultipleChoice(\"question\", choices=regen('answer\\_option[0-4]'), labels=\"correct_answer\",\n    dataset_name = \"tasksource/cycic_multiplechoice\")\n\n\ndef _preprocess_chatgpt_detection(ex):\n    import random\n    label=random.random()<0.5\n    ex['label']=int(label)\n    ex['answer']=[str(ex['human_answers'][0]),str(ex['chatgpt_answers'][0])][label]\n    return ex\n\n#chatgpt_detection = Classification(\"question\",\"answer\",\"label\",\n#    dataset_name = 'Hello-SimpleAI/HC3', config_name=\"all\",\n#    pre_process=lambda dataset:dataset.map(_preprocess_chatgpt_detection))\n\nsts_companion = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/sts-companion\")\n\ncommonsense_qa_2 = Classification(\"question\",labels=\"answer\",\n    dataset_name=\"tasksource/commonsense_qa_2.0\")\n\nling_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/lingnli\")\n\nmonotonicity_entailment = Classification(\"sentence1\", \"sentence2\", \"gold_label\",    \n    dataset_name=\"tasksource/monotonicity-entailment\")\n\narct = MultipleChoice(cat([\"reason\",\"claim\"]),choices=[\"warrant0\",\"warrant1\"],\n    labels=\"correctLabelW0orW1\", dataset_name=\"tasksource/arct\")\n\nscinli = Classification(\"sentence1\", \"sentence2\", labels=\"label\",\n    post_process=lambda x:x.shuffle(seed=0),\n    dataset_name=\"tasksource/scinli\")\n\nnaturallogic = Classification(\" sent1 \",\" sent2 \",\" new_label \",dataset_name=\"tasksource/naturallogic\")\n\nonestop_qa = MultipleChoice(cat([\"paragraph\",\"question\"]),choices_list=\"answers\",\n    labels=constant(0))\n\nmoral_stories = MultipleChoice(cat([\"situation\",\"intention\"]),\n    choices=['moral_action',\"immoral_action\"],labels=constant(0),\n    dataset_name=\"demelin/moral_stories\", config_name=\"full\")\n\nprost = MultipleChoice(cat([\"context\",\"ex_question\"]), choices=['A','B','C','D'],labels=\"label\",\n    dataset_name=\"corypaik/prost\")\n\ndyna_hate = Classification(\"text\",labels=\"label\",dataset_name=\"aps/dynahate\",splits=['train',None,None])\n\nsyntactic_augmentation_nli = Classification('sentence1',\"sentence2\",\"gold_label\",dataset_name=\"metaeval/syntactic-augmentation-nli\")\n\nautotnli = Classification(\"premises\", \"hypothesis\", \"label\", dataset_name=\"tasksource/autotnli\")\n#equate = Classification(\"sentence1\", \"sentence2\", \"gold_label\",dataset_name=\"metaeval/equate\")\n\nconqada = Classification(\"sentence1\",\"sentence2\",\"label\",dataset_name=\"lasha-nlp/CONDAQA\",\n    pre_process = lambda ds:ds.filter(lambda x:x['label'] in {\"DON'T KNOW\",\"YES\",\"NO\"})\n)\n\nwebgbpt_comparisons = MultipleChoice(get.question.full_text, choices=['answer_0','answer_1'],\n    labels=lambda x:int(x['score_1']>0),\n    dataset_name=\"openai/webgpt_comparisons\")\n\nsynthetic_instruct = MultipleChoice('prompt', choices=['chosen', 'rejected'],\n    labels=constant(0), dataset_name=\"Dahoas/synthetic-instruct-gptj-pairwise\")\n\nscruples = Classification(\"text\",labels=\"binarized_label\",dataset_name=\"metaeval/scruples\")\n\nwouldyourather = MultipleChoice(constant('Most people would rather:'), choices=['option_a','option_b'],\n    labels= lambda x: int(x['votes_a']<x['votes_b']),\n    dataset_name=\"metaeval/wouldyourather\")\n\n#attempto_nli = Classification(\"premise\",\"hypothesis\",\n#    lambda x:f'race-{x[\"race_label\"]}',\n#    dataset_name=\"sileod/attempto-nli\")\n\ndefeasible_nli = Classification(cat([\"Premise\",\"Hypothesis\"]),\"Update\",labels=\"UpdateType\",\n    dataset_name=\"metaeval/defeasible-nli\",config_name=['atomic', 'snli'])\n\n#defeasible_nli_social = Classification(cat([\"SocialChemROT\",\"Hypothesis\"]),\"Update\",labels=\"UpdateType\",\n#    dataset_name=\"metaeval/defeasible-nli\",config_name='social')\n\nhelp_nli = Classification(\"ori_sentence\",\"new_sentence\",\"gold_label\",\n    dataset_name=\"tasksource/help-nli\")\n    \nnli_veridicality_transitivity = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name=\"metaeval/nli-veridicality-transitivity\")\n\nlonli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"tasksource/lonli\")\n\ndadc_limit = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/dadc-limit-nli\")\n\nflute = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"ColumbiaNLP/FLUTE\")\n\nstrategy_qa = Classification('question',labels='answer',\n    dataset_name=\"tasksource/strategy-qa\",splits=['train',None,None])\n\nsummarize_from_feedback = MultipleChoice(get.info.post,\n    choices_list=lambda x: [x['summaries'][0]['text'],x['summaries'][1]['text']],\n    labels=\"choice\",\n    dataset_name=\"openai/summarize_from_feedback\", config_name=\"comparisons\",\n    pre_process = lambda ds:ds.filter(lambda x: type(get.info.post(x))==str)\n)\n\nfolio = Classification(\"premises\",\"conclusion\",\n    labels=lambda x:{'False':'contradiction','True':'entailment', 'Uncertain':'neutral'}.get(x[\"label\"]),\n    dataset_name=\"tasksource/folio\")\n\ntomi_nli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"tasksource/tomi-nli\")\n\navicenna = Classification(\"Premise 1\",\"Premise 2\",\"Syllogistic relation\",\n    dataset_name=\"tasksource/avicenna\")\n\nshp = MultipleChoice(\"history\",\n    choices=['human_ref_A','human_ref_B'],\n    labels=\"labels\",\n    dataset_name=\"stanfordnlp/SHP\")\n\nmedqa_usmle = MultipleChoice('sent1',choices=regen('ending[0-3]'),labels='label',\n    dataset_name=\"GBaker/MedQA-USMLE-4-options-hf\")\n\nwikimedqa = MultipleChoice(\"text\",choices=regen('option\\_[0-7]'),labels='label',\n    dataset_name=\"sileod/wikimedqa\",\n    config_name=[\"medwiki\"])\n\ncicero = MultipleChoice(lambda x: \" \".join(x['Dialogue']),\n    choices_list=\"Choices\", labels=lambda x:x['Human Written Answer'][0],\n    dataset_name=\"declare-lab/cicero\")\n\ncreak = Classification(\"sentence\",labels=\"label\",\n    dataset_name='amydeng2000/CREAK')\n\nmutual = MultipleChoice(\"article\",choices_list=\"options\",\n    labels=lambda x: \"ABCD\".index(x['answers']),\n    dataset_name=\"tasksource/mutual\",splits=[\"train\",None,None])\n\nneqa = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/NeQA\")\nquote_repetition = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/quote-repetition\")\nredefine_math = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/redefine-math\")\n\npuzzte = Classification(\"puzzle_text\",\"question\",\"answer\",\n    dataset_name=\"tasksource/puzzte\")\n\nimplicatures = MultipleChoice(cat(['context','response'],\"\\n\"),\n    choices=['correct_implicature','incorrect_implicature'],\n    labels=constant(0),\n    dataset_name='tasksource/implicatures')\n\nrace = MultipleChoice(cat(['question','article'],'\\n'), choices_list='options',\n    labels=lambda x:'ABCDE'.index(x['answer']),\n    config_name=['middle','high'])\n\nrace_c = MultipleChoice(cat(['question','article'],'\\n'),choices_list='option',labels='label',\n    dataset_name='tasksource/race-c')\n\nspartqa_yn=Classification(\"story\",\"question\",\"answer\",\n    dataset_name=\"tasksource/spartqa-yn\")\n\nspartqa_mc=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",labels=\"answer\",\n    dataset_name=\"tasksource/spartqa-mchoice\")\n\ntemporal_nli = Classification(\"Premise\",\"Hypothesis\",\"Label\",\n    dataset_name=\"tasksource/temporal-nli\")\n\nriddle_sense = MultipleChoice(\"question\", choices_list=get.choices.text, \n    labels=lambda x : \"ABCDE\".index(x['answerKey']))\n\nclcd = Classification(\n    \"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/clcd-english\")\n\ntwentyquestions = Classification(\"question\",\"subject\",\"answer\",dataset_name=\"maximedb/twentyquestions\")\n\nreclor = MultipleChoice(cat([\"context\",\"question\"]),choices_list=\"answers\",labels=\"label\",\n    dataset_name=\"metaeval/reclor\",splits=['train','validation',None])\n\nc_aug_imdb = Classification(\"Text\",labels=\"Sentiment\",\n    dataset_name='tasksource/counterfactually-augmented-imdb')\n\nc_aug_snli = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name='tasksource/counterfactually-augmented-snli')\n\ncnli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name='metaeval/cnli')\n\nperturbed_boolq = Classification(\"question\",labels=\"hard_label\",\n    dataset_name='tasksource/boolq-natural-perturbations')\n\n#mega_acceptability = Classification(\"sentence\",labels=\"average\",\n#    dataset_name='metaeval/mega-acceptability-v2')\n\ngraded_acceptability = Classification(\"text\",labels=\"normalized_score\",\n    dataset_name=\"metaeval/acceptability-prediction\")\n\nequate = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name='metaeval/equate')\n\nscience_qa = MultipleChoice(\"question\",choices_list=\"choices\",labels=\"answer\",\n    dataset_name=\"tasksource/ScienceQA_text_only\")\n\nekar=MultipleChoice(\"question\",choices_list=get.choices.text,\n    labels=lambda x:\"ABCD\".index(x['answerKey']),\ndataset_name=\"Jiangjie/ekar_english\")\n\nimplicit_hate = Classification(\"post\",labels=\"class\",\n    dataset_name=\"tasksource/implicit-hate-stg1\")\n\nnli_unambiguity = Classification(\"premise\",\"hypothesis\",\"gini\",\n    dataset_name=\"metaeval/chaos-mnli-ambiguity\")\n\nheadline_cause = Classification('left_title','right_title','label',\n    dataset_name='IlyaGusev/headline_cause',config_name='en_simple')\n\nlogiqa_2 = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/logiqa-2.0-nli\")\n\n_oasst = dict(dataset_name=\"tasksource/oasst2_dense_flat\",\n    pre_process = lambda ds:ds.filter(lambda x:x['lang']=='en'))\n\noasst1__quality = Classification(\"parent_text\",\"text\",labels=\"quality\",**_oasst)\noasst1__toxicity = Classification(\"parent_text\",\"text\",labels=\"toxicity\",**_oasst)\noasst1__helpfulness = Classification(\"parent_text\",\"text\",labels=\"helpfulness\",**_oasst)\n\nmindgames = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"sileod/mindgames\")\n\ndef _udep_post_process(ds):\n    return ds.cast_column('labels', Sequence(ClassLabel(names=udep_en_labels)))\n\nudep__deprel = TokenClassification('tokens',lambda x:[udep_en_labels.index(a) for a in x['deprel']],\n    config_name=udep_en_configs,dataset_name=\"universal_dependencies\",post_process=_udep_post_process)\n\nambient= Classification(\"premise\",\"hypothesis\",\"hypothesis_ambiguous\",dataset_name=\"metaeval/ambient\")\n\npath_naturalness = MultipleChoice(constant(\"\"),choices=['choice1','choice2'],labels=\"label\",\n    dataset_name=\"metaeval/path-naturalness-prediction\")\n\ncivil_comments__toxicity = Classification(\"text\",labels=\"toxicity\")\ncivil_comments__severe_toxicity = Classification(\"text\",labels=\"severe_toxicity\")\ncivil_comments__obscene = Classification(\"text\",labels=\"obscene\")\ncivil_comments__threat = Classification(\"text\",labels=\"threat\")\ncivil_comments__insult = Classification(\"text\",labels=\"insult\")\ncivil_comments__identity_attack = Classification(\"text\",labels=\"identity_attack\")\ncivil_comments__sexual_explicit = Classification(\"text\",labels=\"sexual_explicit\")\n\ncloth = MultipleChoice(\"sentence\", choices_list=lambda x:[x[\"answer\"]]+x[\"distractors\"],labels=constant(0), dataset_name=\"AndyChiang/cloth\")\ndgen  = MultipleChoice(\"sentence\", choices_list=lambda x:[x[\"answer\"]]+x[\"distractors\"],labels=constant(0), dataset_name=\"AndyChiang/dgen\")\n\ni2d2 = Classification(\"sentence1\",labels=name('label',['False','True']), dataset_name=\"tasksource/I2D2\")\n\narg_me = Classification('argument','conclusion','stance', dataset_name=\"webis/args_me\")\nvalueeval_stance = Classification(\"Premise\",\"Conclusion\",\"Stance\", dataset_name=\"webis/Touche23-ValueEval\")\nstarcon = Classification('argument','topic','label',dataset_name=\"tasksource/starcon\")\n\nbanking77 = Classification(\"text\",labels=\"label\",dataset_name=\"PolyAI/banking77\")\n    \ncontrol = Classification('premise','hypothesis',\"label\",dataset_name=\"tasksource/ConTRoL-nli\")\ntracie = Classification(\"premise\",\"hypothesis\",\"answer\",dataset_name='tasksource/tracie')\nsherliic = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='tasksource/sherliic')\n\nsen_making__1 = MultipleChoice(constant('Chose most plausible:'), choices=['sentence0','sentence1'],labels='false', \n    dataset_name=\"tasksource/sen-making\")\n\nsen_making__2 = MultipleChoice(lambda x: [x['sentence0'],x['sentence1']][x['false']] + '\\n is not plausible because :',\n    choices=['A','B','C'],labels=lambda x: 'ABC'.index(x['reason']), dataset_name=\"tasksource/sen-making\")\n\nwinowhy = Classification('sentence', lambda x: f'In \"{x[\"wnli_sent1\"]}\", {x[\"wnli_sent2\"]}',\n    labels=name('label',['False','True']), dataset_name=\"tasksource/winowhy\")\n\n#for CFG in \"cognitive-bias\", \"fake-news\", \"gender-bias\", \"hate-speech\", \"linguistic-bias\", \"political-bias\", \"racial-bias\", \"text-level-bias\":\n#    print(f\"mbib__{CFG.replace('-','_')} = Classification('text',labels=name('label',['not {CFG}','{CFG}']), dataset_name='mediabiasgroup/mbib-base', config_name='{CFG}')\")\n\n\"\"\"\nmbib_cognitive_bias\t= Classification('text',labels=name('label',['not cognitive-bias','cognitive-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='cognitive-bias')\nmbib_fake_news\t= Classification('text',labels=name('label',['not fake-news','fake-news']), dataset_name='mediabiasgroup/mbib-base', config_name='fake-news')\nmbib_gender_bias\t= Classification('text',labels=name('label',['not gender-bias','gender-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='gender-bias')\nmbib_hate_speech\t= Classification('text',labels=name('label',['not hate-speech','hate-speech']), dataset_name='mediabiasgroup/mbib-base', config_name='hate-speech')\nmbib_linguistic_bias\t= Classification('text',labels=name('label',['not linguistic-bias','linguistic-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='linguistic-bias')\nmbib_political_bias\t= Classification('text',labels=name('label',['not political-bias','political-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='political-bias')\nmbib_racial_bias\t= Classification('text',labels=name('label',['not racial-bias','racial-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='racial-bias')\nmbib_text_level_bias\t= Classification('text',labels=name('label',['not text-level-bias','text-level-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='text-level-bias')\n\"\"\"\n\nrobustLR = Classification(\"context\",\"statement\",\"label\", dataset_name=\"tasksource/robustLR\")\n\ncluttr = Classification(\"story\",\"query\", \"target_text\",dataset_name=\"CLUTRR/v1\", config_name=\"gen_train234_test2to10\")\n\nlogical_fallacy = Classification(\"source_article\", labels=\"logical_fallacies\", dataset_name=\"tasksource/logical-fallacy\")\n\nparade = Classification(\"Definition1\",\"Definition2\", labels=name('Binary labels',[\"not-paraphrase\",\"paraphrase\"]), dataset_name=\"tasksource/parade\")\n\ncladder = Classification(\"given_info\", \"question\", \"answer\",dataset_name=\"tasksource/cladder\")\n\nsubjectivity = Classification(\"Sentence\",labels=\"Label\",dataset_name=\"tasksource/subjectivity\")\n\nmoh   = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/MOH\")\nvuac  = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/VUAC\")\ntrofi = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/TroFi\", splits=['train',None,'test'])\n\nsharc_classification = Classification(\"snippet\", lambda x:f'{x[\"scenario\"]}\\n{x[\"question\"]}',\n    labels=lambda x:x[\"answer\"] if x['answer'] in  {\"Yes\",\"No\",\"Irrelevant\"} else \"Clarification needed\",\n    dataset_name='sharc_modified',config_name='mod')\n\nconceptrules_v2 = Classification(\"context\", \"text\", \"label\", dataset_name=\"tasksource/conceptrules_v2\")\n\nscidtb = Classification(\"unit1_txt\",\"unit2_txt\",\"label\", dataset_name=\"metaeval/disrpt\",config_name='eng.dep.scidtb.rels')\n\nchunking = TokenClassification(\"tokens\",\"chunk_tags\", dataset_name=\"conll2000\")\n\nfew_nerd = TokenClassification(\"tokens\",\"fine_ner_tags\",dataset_name=\"DFKI-SLT/few-nerd\",config_name='supervised')\nfiner = TokenClassification('tokens','ner_tags',dataset_name='nlpaueb/finer-139')\n\nlabel_nli = Classification(\"premise\",\"hypothesis\",\"labels\",dataset_name='tasksource/zero-shot-label-nli')\n\ncom2sense = Classification(\"sent\",labels=\"label\",dataset_name=\"tasksource/com2sense\",splits=['train',\"validation\",None])\n\nscone = Classification('sentence1_edited','sentence2_edited','gold_label_edited',dataset_name=\"tasksource/scone\")\n\nwinodict = MultipleChoice(cat(['definition','sentence']),['option1','option2'],'label',dataset_name='tasksource/winodict')\n\nfool_me_twice = Classification(\n    lambda x: \" \".join(a['text'] for a in x['gold_evidence']),\n    'text', 'label', dataset_name='tasksource/fool-me-twice')\n\nmonli = Classification(\"sentence1\",\"sentence2\",\"gold_label\", dataset_name=\"tasksource/monli\")\n\ncausality = Classification('premise','hypothesis','relation', dataset_name='tasksource/corr2cause')\n\nlsat = MultipleChoice(cat(['passage','question']), choices_list='references',labels='gold_index',dataset_name='lighteval/lsat_qa',config_name='all')\n\napt = Classification('text_a','text_b',name('labels',['not_paraphrase','paraphrase']),dataset_name='tasksource/apt')\n\n#xsum_factuality = Classification(\"summary\",labels=\"is_factual\")\n\nfinancial_sentiment = Classification(\"text\",labels=name('label',['Bearish','Bullish','Neutral']),\n    dataset_name=\"zeroshot/twitter-financial-news-sentiment\")\n\ndef _icl_rand(x):\n    import random\n    return random.Random(x['sentence1'][:50]).randint(0,1) #deterministic label for each input\n\nicl = Classification(\"inputs\", lambda x: x['symbols'][_icl_rand(x)],\n    labels=lambda x: str(x['symbols'][_icl_rand(x)]==x['targets']),\n    dataset_name=\"tasksource/icl-symbol-tuning-instruct\",\n    pre_process=lambda ds:ds.filter(lambda x:len(x['inputs'])<500*4), # 500 tokens of 4 char \n)\n\nspace_nli = Classification(\"premises\",\"hypothesis\",\"label\",dataset_name=\"tasksource/SpaceNLI\")\n\npropsegment = Classification(\"hypothesis\",\"premise\",\n    labels = lambda x:{'n':'neutral','e':'entailment','c':'contradiction'}[x['label']],\n    dataset_name=\"sihaochen/propsegment\",config_name='nli')\n\nhatemoji = Classification('text',labels=name(\"label_gold\", ['not-hate-speech','hate-speech']),\n    dataset_name=\"HannahRoseKirk/HatemojiBuild\")\n\nregset = Classification(\"context\",labels=\"answer\",dataset_name='tasksource/regset')\n\nesci = Classification('query','product_text','esci_label',\n    dataset_name=\"tasksource/esci\",\n    pre_process=lambda ds:ds.filter(lambda x:x['product_locale']=='us'))\n\ndef _preprocess_chatbot_arena(ds):\n    ds=ds.filter(lambda x:x['winner'] in [\"model_a\",\"model_b\"])\n    ds=ds.filter(lambda x:x['language']==\"English\")\n\n    def _unroll(x):\n        f=lambda x:\"\\n\".join([f\"{turn['role']}:\\n{turn['content']}\" for turn in x])\n        x['conversation_a'] = f(x['conversation_a'])\n        x['conversation_b'] = f(x['conversation_b'])\n        return x\n    ds=ds.map(_unroll)\n    return ds\n\nchatbot_arena = MultipleChoice(constant(\"\"),\n    choices=[\"conversation_a\",\"conversation_b\"],\n    labels=lambda x: [\"model_a\",\"model_b\"].index(x[\"winner\"]),\n    dataset_name=\"lmsys/chatbot_arena_conversations\",\n    pre_process=_preprocess_chatbot_arena)\n\ndnd_intent = Classification(\"examples\",labels=\"label_names\",\n    dataset_name='neurae/dnd_style_intents')\n\nfld = Classification(\"context\",\"hypothesis\", \"proof_label\",\n    dataset_name=\"hitachi-nlp/FLD.v2\",config_name=\"default\")\n\nflds = Classification(\"context\",\"hypothesis\", \"proof_label\",\n    dataset_name=\"hitachi-nlp/FLD.v2\",config_name=\"star\")\n\nsdoh_nli = Classification(\"premise\",\"hypothesis\",labels=lambda x:{True:\"entailment\",False:\"not_entailment\"}[x['label']],\n    dataset_name=\"tasksource/SDOH-NLI\")\n\nscifact_entailment = Classification(lambda x:\"\\n\".join(x[\"abstract\"]),\"claim\",\n    labels=lambda x:x['verdict'].replace('NEI','NEUTRAL').lower(),\n    dataset_name=\"allenai/scifact_entailment\")\n\nfeasibilityQA = Classification(cat(['knowledge','premise']),'hypothesis','binary_classification_label',\n    dataset_name=\"tasksource/feasibilityQA\")\n                               \nsimple_pair = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"tasksource/simple_pair\")\nadjective_scale_probe = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"tasksource/AdjectiveScaleProbe-nli\")\nrepectively_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/resnli\")\n\nspartun=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",\n    labels=lambda x: [c.lower() for c in x['choices_list']].index(x[\"answer\"][0].lower()),\n    pre_process=lambda ds:ds.filter(lambda x:len(x['answer'])==1),\n    dataset_name=\"tasksource/SpaRTUN\")\n\nresq=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",\n    labels=lambda x: [c.lower() for c in x['choices_list']].index(x[\"answer\"][0].lower()),\n    pre_process=lambda ds:ds.filter(lambda x:len(x['answer'])==1),\n    dataset_name=\"tasksource/ReSQ\")\n\nsemantic_fragments_nli = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name=\"tasksource/semantic_fragments_nli\")\n\nmoritz_zs_nli = Classification('text','hypothesis','labels',\n    pre_process=lambda ds:ds.filter(lambda x:x['task_name'] not in  [\"mnli\", \"anli\", \"fevernli\", \"wanli\", \"lingnli\"]),\n    dataset_name=\"MoritzLaurer/dataset_train_nli\"\n) \n\nstepgame = Classification('story','question','label',dataset_name=\"tasksource/stepgame\")\n\ndef _nlgraph_binarize(x):\n    a=x['answer'].lower()\n    if \"yes\" in a: return \"True\"\n    if \"no\" in a: return \"False\"\n    assert False\n\nnlgraph = Classification('question',labels=_nlgraph_binarize,\n    pre_process=lambda ds:ds.filter(lambda x:x['task'] in \"connectivity cycle hamilton\"),\n    dataset_name=\"tasksource/nlgraph\")\n\noasst_rlhf = MultipleChoice(\"prompt\",choices=['chosen','rejected'],labels=constant(0),\n    dataset_name=\"tasksource/oasst2_pairwise_rlhf_reward\")\n\nanthropic_rlhf_helpfulness = MultipleChoice(constant('Most helpful assistant answer:'), ['chosen','rejected'], constant(0),\n    dataset_name=\"tasksource/hh-rlhf\",config_name=[\"helpful-base\", \"helpful-online\", \"helpful-rejection-sampled\"])\n\nanthropic_rlhf_harmless = MultipleChoice(constant('Most harmless assistant answer:'), ['chosen','rejected'], constant(0),\n    dataset_name=\"tasksource/hh-rlhf\",config_name=\"harmless-base\")\n\nruletaker = Classification(\n    lambda x: 'What is not explicitly stated as true is considered false. \\n' +x[\"context\"], #closed world assumption\n    \"question\",\"label\",dataset_name=\"tasksource/ruletaker\")\n\npara_rules = Classification(\n    lambda x: 'What is not explicitly stated as true is considered false. \\n' +x[\"context\"], #closed world assumption\n    \"question\", labels=name(\"label\",[\"False\",\"True\"]),\n    dataset_name=\"qbao775/PARARULE-Plus\")\n\nproofwriter_deduction = Classification(\"theory\",\"question\",\"answer\",\n    dataset_name=\"tasksource/proofwriter\") #open world assumption\n\nlogical_entailment = Classification(\"A\",\"B\",\"label\",dataset_name='tasksource/logical-entailment')\n\nnope = Classification('premise','hypothesis',\n    labels=lambda x:dict(E='entailment',N='neutral',C='contradiction').get(x['label'],x['label']),\n    dataset_name='tasksource/nope')\n\nlogicNLI = Classification('premise','hypothesis','label',dataset_name='tasksource/LogicNLI')\n\ncontract_nli__seg = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"kiddothe2b/contract-nli\",config_name=\"contractnli_a\")\n\ncontract_nli__full = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"kiddothe2b/contract-nli\",config_name=\"contractnli_b\")\n\nnli4ct = Classification(lambda x: \"\\n\".join(x['Primary_evidence']),'Statement',\"Label\",\n    dataset_name=\"AshtonIsNotHere/nli4ct_semeval2024\",splits=['train','dev',None])\n\nlsat_ar = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',labels=\"label\",\n     dataset_name=\"tasksource/lsat-ar\")\n    \nlsat_rc = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',labels=\"label\",\n     dataset_name=\"tasksource/lsat-rc\")\n    \nbiosift_nli = Classification(\"Abstract\",\"Hypothesis\",\n    labels=lambda x: {True:\"entailment\",False:\"not-entailment\"}[bool(x['Entailment'])],\n    dataset_name=\"AshtonIsNotHere/biosift-nli\")\n\nbrainteasers = MultipleChoice(\"question\",\n    choices_list=lambda x:eval(x[\"choice_list\"]),\n    labels=\"label\",\n    dataset_name=\"tasksource/brainteasers\",config_name=['WP','SP'])\n\n#GATED !\n#toxigen = Classification(\"text\",labels=\"toxicity_human\", dataset_name=\"skg/toxigen-data\")\n\npersuasiveness = Classification(\"claim\",\"argument\",labels=\"persuasiveness_metric\",dataset_name=\"Anthropic/persuasion\")\n\n#ste_wic = Classification(cat(\"text_1\",\"text_2\"),\n#    lambda x:f\"{x['target']} means the same thing in these texts\",\n#    \"gold_label_binary\",\n#    dataset_name=\"cardiffnlp/super_tweeteval\", config_name=\"tempo_wic\",splits=['train','validation',None])\n\n#ste_nerd = Classification(\"text\",\n#    lambda x:f\"definition of {x['target']} here is 'x{['definition']}'\",\n#    \"gold_label_binary\",\n#    dataset_name=\"cardiffnlp/super_tweeteval\", config_name=\"tweet_nerd\",splits=['train','validation',None])\n \n#ste_sim = Classification(\"text_1\",\"text_2\",lambda x:x['gold_score']/5,\n#    dataset_name=\"cardiffnlp/super_tweeteval\",config_name=\"tweet_similarity\",splits=['train','validation',None])\n\n#ste_intimacy = Classification(\"text_1\",labels=lambda x:x['gold_score']/5,\n#    dataset_name=\"cardiffnlp/super_tweeteval\",config_name=\"tweet_intimacy\")\n\n#ccdv/patent-classification|abstract text label\n\nambigNQ = Classification(\"question\",labels=lambda x:{True:\"ambiguous\", False:\"not ambiguous\"}.get(x[\"ambig\"]),\n    dataset_name=\"erbacher/AmbigNQ-clarifying-question\")\n\nsiga_nli = Classification(\"premise\",\"statement\",\"label\",dataset_name=\"tasksource/SIGA-nli\")\n\nunigram_fol = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='unigram/FOL-nli')\n\n#gs_goal = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n#        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"goal\")\n\n#gs_step = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n#        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"step\")\n\ngs_order = MultipleChoice(\"sent2\",regen(\"ending[0-1]\"),\"label\",\n        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"order\")\n\nparadise = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n      dataset_name=\"GGLab/PARADISE\")\n\ndocnli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/doc-nli\")\n\nmctest_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/mctest-nli\")\n\npatent_phrase_similarity = Classification(\"anchor\",\"target\",\"label\",dataset_name=\"tasksource/patent-phrase-similarity\")\n\nnlsat = Classification('sentence',labels='label',dataset_name=\"tasksource/natural-language-satisfiability\")\n\nidioms_nli = Classification('premise','hypothesis','label',dataset_name=\"tasksource/idioms-nli\")\n\nlifeycle_entailment = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='tasksource/lifecycle-entailment')\n\n\nhelpsteer__helpfulness = Classification(\"prompt\", \"response\", \"helpfulness\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__correctness = Classification(\"prompt\", \"response\", \"correctness\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__coherence = Classification(\"prompt\", \"response\", \"coherence\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__complexity = Classification(\"prompt\", \"response\", \"complexity\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__verbosity = Classification(\"prompt\", \"response\", \"verbosity\", dataset_name=\"nvidia/HelpSteer\")\n\nhelpsteer_2__helpfulness = Classification(\"prompt\",\"response\",\"helpfulness\",dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__correctness = Classification(\"prompt\", \"response\", \"correctness\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__coherence = Classification(\"prompt\", \"response\", \"coherence\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__complexity = Classification(\"prompt\", \"response\", \"complexity\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__verbosity = Classification(\"prompt\", \"response\", \"verbosity\", dataset_name=\"nvidia/HelpSteer2\")\n\nmsci_nli = Classification('sentence1','sentence2','label',dataset_name='sadat2307/MSciNLI')\n\n#lex_glue___ecthr_a = Classification(sentence1=\"text\", labels=\"labels\",dataset_name=\"coastalcph/lex_glue\",config_name=\"ecthr_a\") # too long\n#lex_glue___ecthr_b = Classification(sentence1=\"text\", labels=\"labels\") # too long\n\nultrafeedback = MultipleChoice(\"question\", choices=['response_j','response_k'],labels=constant(0), dataset_name=\"pushpdeep/UltraFeedback-paired\")\n\nessay_scoring = Classification(\"full_text\",labels=\"score\",dataset_name='tasksource/AES2-essay-scoring')\n\n#argument_feedback = Classification(\"discourse_text\",labels=\"discourse_effectiveness\", dataset_name=\"tasksource/argument-feedback\")\n\neg = lambda x: Classification(\"full_text\", labels=lambda y:int(y[x]), dataset_name=\"tasksource/english-grading\")\ngrading__cohesion = eg('cohesion')\ngrading__syntax = eg('syntax')\ngrading__vocabulary = eg('vocabulary')\ngrading__phraseology = eg('phraseology')\ngrading__grammar = eg('grammar')\ngrading__conventions = eg('conventions')\n\nwice = Classification(lambda x: \"\\n\".join(x['evidence']),'claim','label',\n    dataset_name='tasksource/wice')\n\nhover = Classification(\"evidence\",\"claim\",\"label\",\n    dataset_name=\"Dzeniks/hover\") \n\nhover__nli = Classification(\"evidence\",\"claim\",name(\"label\",[\"entailment\",\"neutral\",\"contradiction\"]),\n    dataset_name=\"Dzeniks/hover-3way\")\n\ntasksource_dpo = MultipleChoice(\"prompt\",choices=['chosen','rejected'],labels=constant(0),\n    dataset_name=\"tasksource/tasksource_dpo_pairs\")\n\nseahorse = Classification('article',cat([\"summary\", \"question\"]),'answer',\n    dataset_name=\"tasksource/seahorse_summarization_evaluation\")\n\nmip = Classification(\"prompt\",labels=\"y\",\n    dataset_name=\"sileod/missing-item-prediction\",config_name=\"contrastive\")\n\njigsaw_toxicity = Classification('comment_text',labels=name(\"toxic\",[\"notthate\",\"hate\"]),\n    dataset_name=\"tasksource/jigsaw_toxicity\")\n\npol_nli = Classification(\"premise\",\"hypothesis\",labels=name('entailment',['entailment','not_entailment']),\n    dataset_name=\"mlburnham/Pol_NLI\")\n\nsynthetic_retrieval_nli = Classification('premise','hypothesis','label',dataset_name='tasksource/synthetic-retrieval-NLI',\n    config_name=[\"binary\",\"count\",\"position\"],\n    pre_process=lambda ds:ds.filter(lambda x:x['n']<=2048))\n\nissue_similarity = Classification(\"text1\",\"text2\",\"label\",\n    dataset_name=\"WhereIsAI/github-issue-similarity\")\n\n#nli_l2 = Classification(\"sentence1\",\"sentence2\",\"labels\",\n#    dataset_name=\"tasksource/merged-2l-nli\")\n\n#nli_l3 =  Classification(\"sentence1\",\"sentence2\",\"labels\",\n#    dataset_name=\"tasksource/merged-3l-nli\")\n"
  },
  {
    "path": "src/tasksource/__init__.py",
    "content": "from .tasks import *\nfrom .preprocess import *\nfrom .access import *\n"
  },
  {
    "path": "src/tasksource/access.py",
    "content": "from .preprocess import Preprocessing\nimport re\nimport pandas as pd\nfrom . import tasks, recast\nfrom .metadata import dataset_rank\nfrom datasets import load_dataset\nimport funcy as fc\nimport os\nimport copy\nfrom sorcery import dict_of\nfrom functools import cache\nimport random\n\n\nclass lazy_mtasks:\n    def __getattr__(self, name):\n        from . import mtasks\n        return getattr(mtasks, name)\n\n    def __dir__(self):\n        from . import mtasks\n        return dir(mtasks)\nlmtasks=lazy_mtasks()\n\ndef parse_var_name(s):\n    config_name,task_name = None,None\n    if '__' in s and '___' not in s: # dataset__task\n        dataset_name, task_name = s.split('__') \n    elif '__' not in s.replace('___','') and '___' in s: #dataset___config\n        dataset_name, config_name = s.split('___') \n    elif  '___' in s and '__' in s.split('___')[1]: #dataset___config__task\n        dataset_name, config_task=s.split('___')\n        config_name,task_name = config_task.split('__')\n    else: # dataset \n        dataset_name = s\n    return dataset_name,config_name,task_name\n\ndef pretty_name(x):\n    dn = x.dataset_name.split(\"/\")[-1]   \n    cn = x.config_name if x.config_name else \"\"\n    tn = x.task_name if x.task_name else \"\"\n    return f\"{dn}/{cn}/{tn}\".replace('//','/').rstrip('/')\n\n@cache\ndef list_tasks(tasks_path=f'{os.path.dirname(__file__)}/tasks.py',multilingual=False,instruct=False, excluded=[]):\n    if multilingual:\n        tasks_path=tasks_path.replace('/tasks.py','/mtasks.py')\n    task_order = open(tasks_path).readlines()\n    task_order = [x.split('=')[0].rstrip() for x in task_order if '=' in x]\n    task_order = [x for x in task_order if x.isidentifier()]\n    task_order = fc.flip(dict(enumerate(task_order)))\n\n    l = []\n    _tasks = (lmtasks if multilingual else tasks)\n\n    for key in dir(_tasks):\n        if key not in task_order:\n            continue\n        value=getattr(_tasks, key)\n        if isinstance(value,Preprocessing):\n            dataset_name, config_name, task_name = parse_var_name(key)\n            dataset_name = (value.dataset_name if value.dataset_name else dataset_name)\n            config_name = (value.config_name if value.config_name else config_name)\n            hasattr(value,key)\n            l+=[{'dataset_name': dataset_name,\n                 'config_name' : config_name,\n                 'task_name': task_name,\n                 'preprocessing_name': key,\n                'task_type': value.__class__.__name__,'mapping': value,\n                'rank':task_order.get(key,None)}]   \n    df=pd.DataFrame(l).explode('config_name')\n    df = df.sort_values('rank').reset_index(drop=True)\n    df['id'] = df.apply(lambda x: pretty_name(x), axis=1)\n    df.insert(0, 'id', df.pop('id'))\n    del df['rank']\n    if instruct:\n        df=df[df.id.map(lambda x: not any(a in x for a in recast.improper_labels))]\n    df=df[df.id.map(lambda x: not any(x in a for a in excluded))]\n    return df\n\n#task_df =list_tasks()\n#mtask_df =list_tasks(multilingual=True)\n\ndef dict_to_query(d=dict(), **kwargs):\n    d={**d,**kwargs}\n    return '&'.join([f'`{k}`==\"{v}\"' for k,v in d.items()])\n\ndef load_preprocessing(tasks=tasks, **kwargs):\n    _tasks_df = list_tasks(multilingual=tasks==lmtasks)\n    y = _tasks_df.copy().query(dict_to_query(**kwargs)).iloc[0]\n    preprocessing= copy.copy(getattr(tasks, y.preprocessing_name))\n    for c in 'dataset_name','config_name':\n        if not isinstance(getattr(preprocessing,c), str):\n             setattr(preprocessing,c,getattr(y,c))\n    return preprocessing\n\ndef load_task(id=None, dataset_name=None,config_name=None,task_name=None,preprocessing_name=None,\n         max_rows=None, max_rows_eval=None, multilingual=False, instruct=False, seed=0, **load_dataset_kwargs):\n    query = dict_of(id, dataset_name, config_name, task_name,preprocessing_name)\n    query = {k:v for k,v in query.items() if v}\n    _tasks = (lmtasks if multilingual else tasks)\n    preprocessing = load_preprocessing(_tasks, **query)\n\n    if \"trust_remote_code\" not in load_dataset_kwargs:\n        load_dataset_kwargs[\"trust_remote_code\"] = True\n    \n    dataset = load_dataset(preprocessing.dataset_name, preprocessing.config_name, **load_dataset_kwargs)\n    dataset= preprocessing(dataset,max_rows, max_rows_eval)\n    dataset.task_type = preprocessing.__class__.__name__\n    if instruct:\n        dataset=recast.recast_instruct(dataset)\n    return dataset"
  },
  {
    "path": "src/tasksource/metadata/__init__.py",
    "content": "from .bigbench_groups import *\nfrom .blimp_groups import *\nfrom .popularity import *\n\nimppres_presupposition=['presupposition_all_n_presupposition',\n 'presupposition_both_presupposition',\n 'presupposition_change_of_state',\n 'presupposition_cleft_existence',\n 'presupposition_cleft_uniqueness',\n 'presupposition_only_presupposition',\n 'presupposition_possessed_definites_existence',\n 'presupposition_possessed_definites_uniqueness',\n 'presupposition_question_presupposition']\n\nimppres_implicature=['implicature_connectives',\n 'implicature_gradable_adjective',\n 'implicature_gradable_verb',\n 'implicature_modals',\n 'implicature_numerals_10_100',\n 'implicature_numerals_2_3',\n 'implicature_quantifiers']\n\ncrossfit=['emo',\n 'wiki_auto',\n 'liar',\n 'tab_fact',\n 'sms_spam',\n 'google_wellformed_query',\n 'glue',\n 'poem_sentiment',\n 'emotion',\n 'hate_speech18',\n 'hatexplain',\n 'yahoo_answers_topics',\n 'mc_taco',\n 'glue',\n 'mocha',\n 'super_glue',\n 'glue',\n 'yelp_polarity',\n 'tweet_eval',\n 'glue',\n 'art',\n 'super_glue',\n 'ethos',\n 'app_reviews',\n 'yelp_review_full',\n 'anli',\n 'hate_speech_offensive',\n 'climate_fever',\n 'circa',\n 'financial_phrasebank',\n 'wiki_qa',\n 'rotten_tomatoes',\n 'trec',\n 'medical_questions_pairs',\n 'glue',\n 'super_glue',\n 'ade_corpus_v2',\n 'sick',\n 'super_glue',\n 'blimp',\n 'discovery',\n 'health_fact',\n 'ag_news',\n 'boolq',\n 'glue',\n 'amazon_polarity',\n 'scicite',\n 'dbpedia_14',\n 'onestop_english',\n 'crows_pairs',\n 'scitail',\n 'piqa',\n 'glue',\n 'paws',\n 'imdb',\n 'glue',\n 'trec']\n\n#en_esl, en_gumreddit are faulty on HF \nudep_en_configs = ['en_ewt', 'en_gum', 'en_lines', 'en_partut']\nudep_en_labels = ['_', 'acl', 'acl:relcl', 'advcl', 'advmod', 'amod', 'appos', 'aux', 'aux:pass', 'case', 'cc', 'cc:preconj', 'ccomp', 'compound', 'compound:prt', 'conj', 'cop', 'csubj', 'csubj:pass', 'dep', 'det', 'det:predet', 'discourse', 'dislocated', 'expl', 'fixed', 'flat', 'flat:foreign', 'goeswith', 'iobj', 'list', 'mark', 'nmod', 'nmod:npmod', 'nmod:poss', 'nmod:tmod', 'nsubj', 'nsubj:pass', 'nummod', 'obj', 'obl', 'obl:npmod', 'obl:tmod', 'orphan', 'parataxis', 'punct', 'reparandum', 'root', 'vocative', 'xcomp']\n\nudep_labels = ['_', 'acl', 'acl:adv', 'acl:appos', 'acl:attr', 'acl:cleft', 'acl:focus', 'acl:inf', 'acl:part', 'acl:periph', 'acl:poss', 'acl:relat', 'acl:relcl', 'advcl', 'advcl:arg', 'advcl:cleft', 'advcl:cmpr', 'advcl:cond', 'advcl:coverb', 'advcl:lmod', 'advcl:mmod', 'advcl:periph', 'advcl:relcl', 'advcl:sp', 'advcl:svc', 'advcl:tcl', 'advcl:tmod', 'advmod', 'advmod:arg', 'advmod:cc', 'advmod:deg', 'advmod:det', 'advmod:df', 'advmod:emph', 'advmod:lmod', 'advmod:locy', 'advmod:mmod', 'advmod:mode', 'advmod:neg', 'advmod:periph', 'advmod:que', 'advmod:tfrom', 'advmod:tlocy', 'advmod:tmod', 'advmod:to', 'advmod:tto', 'amod', 'amod:advmod', 'amod:att', 'amod:emph', 'amod:flat', 'amod:mode', 'amod:obl', 'appos', 'appos:trans', 'aux', 'aux:aglt', 'aux:aspect', 'aux:caus', 'aux:clitic', 'aux:cnd', 'aux:imp', 'aux:mood', 'aux:neg', 'aux:opt', 'aux:part', 'aux:pass', 'aux:poss', 'aux:q', 'aux:tense', 'case', 'case:acc', 'case:adv', 'case:circ', 'case:dec', 'case:det', 'case:gen', 'case:loc', 'case:pred', 'case:pref', 'case:voc', 'cc', 'cc:nc', 'cc:preconj', 'ccomp', 'ccomp:agent', 'ccomp:cleft', 'ccomp:obj', 'ccomp:obl', 'ccomp:pmod', 'ccomp:pred', 'clf', 'compound', 'compound:a', 'compound:affix', 'compound:coll', 'compound:conjv', 'compound:dir', 'compound:ext', 'compound:lv', 'compound:lvc', 'compound:nn', 'compound:nv', 'compound:plur', 'compound:preverb', 'compound:prt', 'compound:quant', 'compound:redup', 'compound:smixut', 'compound:svc', 'compound:vo', 'compound:vv', 'conj', 'conj:expl', 'conj:extend', 'conj:svc', 'cop', 'cop:expl', 'cop:locat', 'cop:own', 'csubj', 'csubj:cleft', 'csubj:cop', 'csubj:pass', 'dep', 'dep:alt', 'dep:comp', 'dep:mod', 'dep:prt', 'det', 'det:adj', 'det:def', 'det:noun', 'det:numgov', 'det:nummod', 'det:poss', 'det:predet', 'det:pron', 'det:rel', 'discourse', 'discourse:emo', 'discourse:filler', 'discourse:intj', 'discourse:sp', 'dislocated', 'dislocated:acl', 'dislocated:cleft', 'dislocated:conj', 'dislocated:nmod', 'dislocated:nsubj', 'dislocated:obj', 'dislocated:obl', 'expl', 'expl:comp', 'expl:impers', 'expl:pass', 'expl:poss', 'expl:pv', 'expl:subj', 'fixed', 'flat', 'flat:abs', 'flat:foreign', 'flat:name', 'flat:num', 'flat:range', 'flat:repeat', 'flat:sibl', 'flat:title', 'flat:vv', 'goeswith', 'iobj', 'iobj:agent', 'iobj:appl', 'iobj:caus', 'iobj:loc', 'iobj:patient', 'list', 'mark', 'mark:adv', 'mark:advb', 'mark:comp', 'mark:prt', 'mark:rel', 'mark:relcl', 'nmod', 'nmod:abl', 'nmod:advmod', 'nmod:agent', 'nmod:appos', 'nmod:arg', 'nmod:att', 'nmod:attr', 'nmod:bahuv', 'nmod:cau', 'nmod:clas', 'nmod:cmp', 'nmod:comp', 'nmod:dat', 'nmod:flat', 'nmod:gen', 'nmod:gmod', 'nmod:gobj', 'nmod:gsubj', 'nmod:lmod', 'nmod:npmod', 'nmod:obl', 'nmod:obllvc', 'nmod:own', 'nmod:part', 'nmod:periph', 'nmod:pmod', 'nmod:poss', 'nmod:pred', 'nmod:ref', 'nmod:relat', 'nmod:tmod', 'nsubj', 'nsubj:appos', 'nsubj:bfoc', 'nsubj:caus', 'nsubj:cop', 'nsubj:ifoc', 'nsubj:lfoc', 'nsubj:lvc', 'nsubj:nc', 'nsubj:obj', 'nsubj:own', 'nsubj:pass', 'nsubj:periph', 'nummod', 'nummod:det', 'nummod:entity', 'nummod:flat', 'nummod:gov', 'nummod:mod', 'nummod:periph', 'obj', 'obj:advmod', 'obj:agent', 'obj:appl', 'obj:cau', 'obj:caus', 'obj:lvc', 'obj:periph', 'obl', 'obl:abl', 'obl:advmod', 'obl:agent', 'obl:appl', 'obl:arg', 'obl:ben', 'obl:cmpr', 'obl:inst', 'obl:lmod', 'obl:loc', 'obl:mod', 'obl:npmod', 'obl:own', 'obl:patient', 'obl:pmod', 'obl:poss', 'obl:prep', 'obl:sentcon', 'obl:smod', 'obl:soc', 'obl:tmod', 'obl:x', 'orphan', 'parataxis', 'parataxis:appos', 'parataxis:conj', 'parataxis:deletion', 'parataxis:discourse', 'parataxis:dislocated', 'parataxis:hashtag', 'parataxis:insert', 'parataxis:newsent', 'parataxis:nsubj', 'parataxis:obj', 'parataxis:parenth', 'parataxis:rel', 'parataxis:rep', 'parataxis:restart', 'parataxis:speech', 'parataxis:trans', 'punct', 'reparandum', 'root', 'vocative', 'vocative:mention', 'xcomp', 'xcomp:adj', 'xcomp:cleft', 'xcomp:ds', 'xcomp:obj', 'xcomp:obl', 'xcomp:pred', 'xcomp:sp', 'xcomp:subj']"
  },
  {
    "path": "src/tasksource/metadata/bigbench_groups.py",
    "content": "bigbench_discriminative = set(\"\"\"abstract_narrative_understanding\r\nanachronisms\r\nanalogical_similarity\r\nanalytic_entailment\r\narithmetic\r\nauthorship_verification\r\nbbq_lite_json\r\ncausal_judgment\r\ncause_and_effect\r\ncheckmate_in_one\r\ncifar10_classification\r\ncode_line_description\r\ncolor\r\ncommon_morpheme\r\nconceptual_combinations\r\ncontextual_parametric_knowledge_conflicts\r\ncrash_blossom\r\ncrass_ai\r\ncryobiology_spanish\r\ncs_algorithms\r\ndark_humor_detection\r\ndate_understanding\r\ndisambiguation_qa\r\ndiscourse_marker_prediction\r\ndyck_languages\r\nelementary_math_qa\r\nemoji_movie\r\nemojis_emotion_prediction\r\nempirical_judgments\r\nenglish_proverbs\r\nenglish_russian_proverbs\r\nentailed_polarity\r\nentailed_polarity_hindi\r\nepistemic_reasoning\r\nevaluating_information_essentiality\r\nfact_checker\r\nfantasy_reasoning\r\nfigure_of_speech_detection\r\nformal_fallacies_syllogisms_negation\r\ngeneral_knowledge\r\ngeometric_shapes\r\ngoal_step_wikihow\r\ngre_reading_comprehension\r\nhhh_alignment\r\nhindu_knowledge\r\nhinglish_toxicity\r\nhuman_organs_senses\r\nhyperbaton\r\nidentify_math_theorems\r\nidentify_odd_metaphor\r\nimplicatures\r\nimplicit_relations\r\nindic_cause_and_effect\r\nintent_recognition\r\ninternational_phonetic_alphabet_nli\r\nintersect_geometry\r\nirony_identification\r\nkannada\r\nkey_value_maps\r\nknown_unknowns\r\nlanguage_identification\r\nlogic_grid_puzzle\r\nlogical_args\r\nlogical_deduction\r\nlogical_fallacy_detection\r\nlogical_sequence\r\nmathematical_induction\r\nmedical_questions_russian\r\nmetaphor_boolean\r\nmetaphor_understanding\r\nmisconceptions\r\nmisconceptions_russian\r\nmnist_ascii\r\nmoral_permissibility\r\nmovie_dialog_same_or_different\r\nmovie_recommendation\r\nnavigate\r\nnonsense_words_grammar\r\nnovel_concepts\r\nodd_one_out\r\nparsinlu_qa\r\npenguins_in_a_table\r\npersian_idioms\r\nphrase_relatedness\r\nphysical_intuition\r\nphysics\r\nplay_dialog_same_or_different\r\npresuppositions_as_nli\r\nquestion_selection\r\nreal_or_fake_text\r\nreasoning_about_colored_objects\r\nriddle_sense\r\nruin_names\r\nsalient_translation_error_detection\r\nsentence_ambiguity\r\nsimilarities_abstraction\r\nsimple_arithmetic_json_multiple_choice\r\nsimple_ethical_questions\r\nsnarks\r\nsocial_iqa\r\nsocial_support\r\nsports_understanding\r\nstrange_stories\r\nstrategyqa\r\nsuicide_risk\r\nswahili_english_proverbs\r\nswedish_to_german_proverbs\r\nsymbol_interpretation\r\ntemporal_sequences\r\ntimedial\r\ntracking_shuffled_objects\r\nunderstanding_fables\r\nundo_permutation\r\nunit_interpretation\r\nvitaminc_fact_verification\r\nwhat_is_the_tao\r\nwhich_wiki_edit\r\nwinowhy\"\"\".split('\\n')) - {'simple_arithmetic_json_multiple_choice'}\r\n\r\nbigbench_non_english = set(\"\"\"common_morpheme\r\ncryobiology_spanish\r\ngem\r\ngender_inclusive_sentences_german\r\nkanji_ascii\r\nkannada\r\nlanguage_identification\r\nlinguistic_mappings\r\nmedical_questions_russian\r\nmisconceptions_russian\r\nmultiemo\r\npersian_idioms\r\npolish_sequence_labeling\r\nswahili_english_proverbs\r\nswedish_to_german_proverbs\r\nwhat_is_the_tao\r\nwhich_wiki_edit\"\"\".split('\\n')) | {\"parsinlu_qa\",\"hinglish_toxicity\",\"indic_cause_and_effect\",\"entailed_polarity_hindi\",\"english_russian_proverbs\"}\r\n\r\nbbl=set('''auto_debugging\r\nbbq_lite_json\r\ncode_line_description\r\nconceptual_combinations\r\nconlang_translation\r\nemoji_movie\r\nformal_fallacies_syllogisms_negation\r\nhindu_knowledge\r\nknown_unknowns\r\nlanguage_identification\r\nlinguistics_puzzles\r\nlogic_grid_puzzle\r\nlogical_deduction\r\nmisconceptions_russian\r\nnovel_concepts\r\noperators\r\nparsinlu_reading_comprehension\r\nplay_dialog_same_or_different\r\nrepeat_copy_logic\r\nstrange_stories\r\nstrategyqa\r\nsymbol_interpretation\r\nvitaminc_fact_verification\r\nwinowhy'''.split('\\n'))\r\n\r\nbigbench_discriminative_english = bigbench_discriminative - bigbench_non_english"
  },
  {
    "path": "src/tasksource/metadata/blimp_groups.py",
    "content": "import pandas as pd\n\ndfh=pd.read_csv('https://raw.githubusercontent.com/alexwarstadt/blimp/master/raw_results/summary/human_validation_summary.csv')\ndfh['linguistic_term']=dfh['Condition']\ndfm=pd.read_json('https://raw.githubusercontent.com/alexwarstadt/blimp/master/raw_results/summary/models_summary.jsonl',lines=True)\ndf=dfm.join(dfh)\ndf['diff']=df.total_mean - df.gpt2\nblimp_hard = set(df[df['diff']>0.1].UID)\ndel dfh, dfm, df\n\nblimp_groups = {\n \"syntax\": [\n  \"adjunct_island\",\n  \"animate_subject_passive\",\n  \"animate_subject_trans\",\n  \"causative\",\n  \"complex_NP_island\",\n  \"coordinate_structure_constraint_complex_left_branch\",\n  \"coordinate_structure_constraint_object_extraction\",\n  \"drop_argument\",\n  \"ellipsis_n_bar_1\",\n  \"ellipsis_n_bar_2\",\n  \"inchoative\",\n  \"intransitive\",\n  \"left_branch_island_echo_question\",\n  \"left_branch_island_simple_question\",\n  \"passive_1\",\n  \"passive_2\",\n  \"sentential_subject_island\",\n  \"transitive\",\n  \"wh_island\",\n  \"wh_questions_object_gap\",\n  \"wh_questions_subject_gap\",\n  \"wh_questions_subject_gap_long_distance\",\n  \"wh_vs_that_no_gap\",\n  \"wh_vs_that_no_gap_long_distance\",\n  \"wh_vs_that_with_gap\",\n  \"wh_vs_that_with_gap_long_distance\"\n ],\n \"morphology\": [\n  \"anaphor_gender_agreement\",\n  \"anaphor_number_agreement\",\n  \"determiner_noun_agreement_1\",\n  \"determiner_noun_agreement_2\",\n  \"determiner_noun_agreement_irregular_1\",\n  \"determiner_noun_agreement_irregular_2\",\n  \"determiner_noun_agreement_with_adj_2\",\n  \"determiner_noun_agreement_with_adj_irregular_1\",\n  \"determiner_noun_agreement_with_adj_irregular_2\",\n  \"determiner_noun_agreement_with_adjective_1\",\n  \"distractor_agreement_relational_noun\",\n  \"distractor_agreement_relative_clause\",\n  \"irregular_past_participle_adjectives\",\n  \"irregular_past_participle_verbs\",\n  \"irregular_plural_subject_verb_agreement_1\",\n  \"irregular_plural_subject_verb_agreement_2\",\n  \"regular_plural_subject_verb_agreement_1\",\n  \"regular_plural_subject_verb_agreement_2\"\n ],\n \"syntax_semantics\": [\n  \"existential_there_object_raising\",\n  \"existential_there_subject_raising\",\n  \"expletive_it_object_raising\",\n  \"only_npi_scope\",\n  \"principle_A_c_command\",\n  \"principle_A_case_1\",\n  \"principle_A_domain_1\",\n  \"principle_A_domain_2\",\n  \"principle_A_domain_3\",\n  \"principle_A_reconstruction\",\n  \"sentential_negation_npi_scope\",\n  \"tough_vs_raising_1\",\n  \"tough_vs_raising_2\"\n ],\n \"semantics\": [\n  \"existential_there_quantifiers_1\",\n  \"existential_there_quantifiers_2\",\n  \"matrix_question_npi_licensor_present\",\n  \"npi_present_1\",\n  \"npi_present_2\",\n  \"only_npi_licensor_present\",\n  \"sentential_negation_npi_licensor_present\",\n  \"superlative_quantifiers_1\",\n  \"superlative_quantifiers_2\"\n ],\n \"syntax/semantics\": [\n  \"principle_A_case_2\"\n ]\n}\n"
  },
  {
    "path": "src/tasksource/metadata/original.txt",
    "content": "WANLI\nrecast/recast_verbnet\nrecast/recast_verbcorner\nrecast/recast_ner\nrecast/recast_sentiment\nrecast/recast_puns\nrecast/recast_factuality\nrecast/recast_megaveridicality\nprobability_words_nli/reasoning_1hop\nprobability_words_nli/usnli\nprobability_words_nli/reasoning_2hop\nnan-nli/joey234--nan-nli\nnli_fever\nbreaking_nli\nconj_nli\nfracas\ndialogue_nli\nmpe\ndnc\nrecast_white/fnplus\nrecast_white/sprl\nrecast_white/dpr\nrobust_nli/IS_CS\nrobust_nli/LI_LI\nrobust_nli/ST_WO\nrobust_nli/PI_SP\nrobust_nli/PI_CD\nrobust_nli/ST_SE\nrobust_nli/ST_NE\nrobust_nli/ST_LM\nrobust_nli_is_sd\nrobust_nli_li_ts\ngen_debiased_nli/snli_seq_z\ngen_debiased_nli/snli_z_aug\ngen_debiased_nli/snli_par_z\ngen_debiased_nli/mnli_par_z\ngen_debiased_nli/mnli_z_aug\ngen_debiased_nli/mnli_seq_z\nadd_one_rte\nhlgd\nconll2003/pos_tags\nconll2003/chunk_tags\nconll2003/ner_tags\nhh-rlhf\nmodel-written-evals\nfig-qa\nsocial_i_qa\nbalanced-copa\ne-CARE\ninsincere-questions\nTuringBench\nvitaminc/tals--vitaminc\nrumoureval_2019/RumourEval2019\ntweet_eval/irony\ntweet_eval/stance_abortion\ntweet_eval/hate\ntweet_eval/stance_atheism\ntweet_eval/stance_climate\ntweet_eval/emoji\ntweet_eval/offensive\ntweet_eval/sentiment\ntweet_eval/emotion\ntweet_eval/stance_feminist\ntweet_eval/stance_hillary\ndiscovery/discovery\npragmeval/verifiability\npragmeval/mrda\npragmeval/switchboard\npragmeval/emergent\npragmeval/gum\npragmeval/sarcasm\npragmeval/stac\npragmeval/pdtb\nsilicone/dyda_e\nsilicone/oasis\nsilicone/meld_s\nsilicone/meld_e\nsilicone/maptask\nsilicone/dyda_da\nsilicone/sem\nsilicone/iemocap\nlex_glue/scotus\nlex_glue/ledgar\nlanguage-identification\nrotten_tomatoes\nhate_speech18\nsms_spam\nsnips_built_in_intents\nhate_speech_offensive\nhyperpartisan_news\nsciie\ncitation_intent\nscicite\nlexical_relation_classification/ROOT09\nlexical_relation_classification/CogALexV\nlexical_relation_classification/K&H+N\nlexical_relation_classification/BLESS\nlexical_relation_classification/EVALution\ncrowdflower/political-media-bias\ncrowdflower/tweet_global_warming\ncrowdflower/text_emotion\ncrowdflower/political-media-message\ncrowdflower/political-media-audience\ncrowdflower/economic-news\ncrowdflower/corporate-messaging\ncrowdflower/airline-sentiment\ncrowdflower/sentiment_nuclear_power\nethics/commonsense\nethics/deontology\nethics/justice\nethics/virtue\ntweets_hate_speech_detection\nwnut_17/wnut_17\nncbi_disease/ncbi_disease\nacronym_identification\njnlpba/jnlpba\nontonotes_english/SpeedOfMagic--ontonotes_english\nblog_authorship_corpus/gender\nblog_authorship_corpus/horoscope\nblog_authorship_corpus/job\nopen_question_type\nmc_taco\ndiscosense\nEffectiveFeedbackStudentWriting\nphrase_similarity\nscientific-exaggeration-detection\nfever-evidence-related/mwong--fever-related\ndynasent/dynabench.dynasent.r1.all/r1\ndynasent/dynabench.dynasent.r2.all/r2\nsem_eval_2010_task_8\nmedmcqa\nlogiqa\ncycic_classification\ncycic_multiplechoice\ncommonsense_qa_2.0\nlingnli\nmonotonicity-entailment\narct\nscinli\nnaturallogic\nonestop_qa\nmoral_stories/full\nprost\ndynahate\nsyntactic-augmentation-nli\nautotnli\nCONDAQA\nwebgpt_comparisons\nsynthetic-instruct-gptj-pairwise\nscruples\nwouldyourather\nattempto-nli\ndefeasible-nli/snli\ndefeasible-nli/atomic\nhelp-nli\nnli-veridicality-transitivity\nnatural-language-satisfiability\nlonli\ndadc-limit-nli\nFLUTE\nsummarize_from_feedback/comparisons\nfolio\ntomi-nli\navicenna\nSHP\nMedQA-USMLE-4-options-hf\nwikimedqa/medwiki\ncicero\nmutual\nNeQA\nquote-repetition\nredefine-math\npuzzte\nimplicatures\nrace-c\nspartqa-yn\nspartqa-mchoice\ntemporal-nli\nriddle_sense\nclcd-english\ntwentyquestions\nreclor\ncounterfactually-augmented-imdb\ncounterfactually-augmented-snli\ncnli\nboolq-natural-perturbations\nequate\nScienceQA_text_only\nekar_english\nimplicit-hate-stg1\nlogiqa-2.0-nli\nPARARULE-Plus\nmindgames\nuniversal_dependencies/en_partut/deprel\nuniversal_dependencies/en_lines/deprel\nuniversal_dependencies/en_gum/deprel\nuniversal_dependencies/en_ewt/deprel\nambient\npath-naturalness-prediction\ncloth\ndgen\noasst1_pairwise_rlhf_reward\nI2D2\nargs_me\nTouche23-ValueEval\nstarcon\nbanking77\nruletaker\nlsat_qa/all\nConTRoL-nli\ntracie\nsherliic\nsen-making/1\nsen-making/2\nmbib-base/cognitive-bias\nmbib-base/fake-news\nmbib-base/gender-bias\nmbib-base/hate-speech\nmbib-base/linguistic-bias\nmbib-base/political-bias\nmbib-base/racial-bias\nmbib-base/text-level-bias\nrobustLR\nv1/gen_train234_test2to10\nlogical-fallacy\nparade\ncladder\nsubjectivity\nMOH\nVUAC\nTroFi\nsharc_modified/mod\nconceptrules_v2\ndisrpt/eng.dep.scidtb\nconll2000\nfew-nerd/supervised\ncom2sense\nscone\nwinodict\nfool-me-twice\nmonli\ncorr2cause\napt\ntwitter-financial-news-sentiment\nSpaceNLI\npropsegment/nli\nHatemojiBuild\nregset\nesci\ndnd_style_intents\n"
  },
  {
    "path": "src/tasksource/metadata/popularity.py",
    "content": "dataset_rank = {'glue': 0,\r\n 'super_glue': 12,\r\n 'tweet_eval': 23,\r\n 'blimp': 34,\r\n 'imdb': 101,\r\n 'wikitext': 102,\r\n 'squad': 106,\r\n 'trec': 107,\r\n 'openwebtext': 108,\r\n 'rotten_tomatoes': 109,\r\n 'anli': 110,\r\n 'adversarial_qa': 111,\r\n 'ai2_arc': 115,\r\n 'xsum': 117,\r\n 'amazon_reviews_multi': 118,\r\n 'ag_news': 125,\r\n 'yelp_review_full': 126,\r\n 'wino_bias': 127,\r\n 'piqa': 131,\r\n 'duorc': 132,\r\n 'quail': 134,\r\n 'trivia_qa': 135,\r\n 'cnn_dailymail': 143,\r\n 'common_gen': 146,\r\n 'sst': 147,\r\n 'conll2003': 150,\r\n 'financial_phrasebank': 151,\r\n 'babi_qa': 155,\r\n 'poem_sentiment': 163,\r\n 'dream': 164,\r\n 'paws': 165,\r\n 'emotion': 168,\r\n 'kilt_tasks': 169,\r\n 'sciq': 180,\r\n 'cos_e': 181,\r\n 'dbpedia_14': 183,\r\n 'newsgroup': 184,\r\n 'cosmos_qa': 244,\r\n 'squad_v2': 245,\r\n 'samsum': 246,\r\n 'amazon_polarity': 247,\r\n 'multi_news': 248,\r\n 'wiki_hop': 249,\r\n 'quartz': 251,\r\n 'qasc': 252,\r\n 'wiki_qa': 253,\r\n 'openbookqa': 254,\r\n 'ropes': 256,\r\n 'quoref': 257,\r\n 'snli': 258,\r\n 'app_reviews': 259,\r\n 'gigaword': 260,\r\n 'wiki_bio': 261,\r\n 'amazon_us_reviews': 262,\r\n 'scan': 308,\r\n 'race': 320,\r\n 'swag': 323,\r\n 'codah': 325,\r\n 'ccdv/arxiv-summarization': 331,\r\n 'subjqa': 333,\r\n 'universal_morphologies': 339,\r\n 'hans': 447,\r\n 'sst2': 448,\r\n 'guardian_authorship': 449,\r\n 'math_qa': 465,\r\n 'librispeech_asr': 466,\r\n 'hendrycks_test': 469,\r\n 'openai_humaneval': 526,\r\n 'ptb_text_only': 527,\r\n 'pubmed_qa': 528,\r\n 'head_qa': 531,\r\n 'ought/raft': 533,\r\n 'ade_corpus_v2': 544,\r\n 'cbt': 547,\r\n 'bookcorpus': 552,\r\n 'squadshifts': 553,\r\n 'story_cloze': 557,\r\n 'multi_nli': 559,\r\n 'qanta': 560,\r\n 'hate_speech18': 564,\r\n 'gem': 565,\r\n 'lex_glue': 599,\r\n 'deepmind/code_contests': 606,\r\n 'imagenet-1k': 607,\r\n 'blended_skill_talk': 608,\r\n 'sms_spam': 609,\r\n 'asset': 610,\r\n 'fever': 612,\r\n 'commonsense_qa': 615,\r\n 'scientific_papers': 616,\r\n 'evidence_infer_treatment': 618,\r\n 'hotpot_qa': 620,\r\n 'superb': 622,\r\n 'sick': 628,\r\n 'humicroedit': 629,\r\n 'snips_built_in_intents': 631,\r\n 'winograd_wsc': 632,\r\n 'bigbench': 634,\r\n 'multi_woz_v22': 801,\r\n 'lambada': 803,\r\n 'banking77': 804,\r\n 'hate_speech_offensive': 805,\r\n 'yahoo_answers_topics': 806,\r\n 'ccdv/cnn_dailymail': 807,\r\n 'hyperpartisan_news_detection': 810,\r\n 'gsm8k': 812,\r\n 'wikisql': 814,\r\n 'the_pile': 815,\r\n 'health_fact': 825,\r\n 'mdd': 826,\r\n 'web_questions': 830,\r\n 'ethos': 831,\r\n 'wnut_17': 833,\r\n 'medical_questions_pairs': 834,\r\n 'scitldr': 835,\r\n 'drop': 838,\r\n 'squad_adversarial': 839,\r\n 'e2e_nlg_cleaned': 841,\r\n 'onestop_english': 842,\r\n 'pragmeval': 843,\r\n 'relbert/analogy_questions': 863,\r\n 'nq_open': 869,\r\n 'daily_dialog': 870,\r\n 'mc_taco': 871,\r\n 'crows_pairs': 872,\r\n 'go_emotions': 873,\r\n 'ncbi_disease': 875,\r\n 'boolq': 876,\r\n 'movie_rationales': 877,\r\n 'climate_fever': 878,\r\n 'discovery': 879,\r\n 'lama': 881,\r\n 'ecthr_cases': 885,\r\n 'jfleg': 887,\r\n 'selqa': 888,\r\n 'acronym_identification': 892,\r\n 'scicite': 893,\r\n 'tab_fact': 894,\r\n 'wiki_asp': 896,\r\n 'enriched_web_nlg': 916,\r\n 'svhn': 918,\r\n 'docred': 920,\r\n 'conllpp': 921,\r\n 'liar': 922,\r\n 'multi_x_science_sum': 923,\r\n 'discofuse': 924,\r\n 'competition_math': 926,\r\n 'biosses': 927,\r\n 'jnlpba': 928,\r\n 'web_nlg': 929,\r\n 'qa_srl': 937,\r\n 'neural_code_search': 938,\r\n 'conv_ai_2': 940,\r\n 'craigslist_bargains': 941,\r\n 'qed': 942,\r\n 'conv_ai_3': 943,\r\n 'conv_ai': 944,\r\n 'turk': 945,\r\n 'covid_qa_castorini': 946,\r\n 'sem_eval_2014_task_1': 947,\r\n 'mwsc': 948,\r\n 'gutenberg_time': 949,\r\n 'billsum': 950,\r\n 'riddle_sense': 951,\r\n 'species_800': 952,\r\n 'hlgd': 953,\r\n 'definite_pronoun_resolution': 954,\r\n 'tmu_gfm_dataset': 955,\r\n 'relbert/semeval2012_relational_similarity_v4': 956,\r\n 'clinc_oos': 957,\r\n 'imppres': 960,\r\n 'mrqa': 976,\r\n 'cc_news': 977,\r\n 'lmqg/qag_tweetqa': 978,\r\n 'aeslc': 979,\r\n 'big_patent': 980,\r\n 'eli5': 990,\r\n 'scene_parse_150': 991,\r\n 'circa': 993,\r\n 'aqua_rat': 994,\r\n 'nlu_evaluation_data': 996,\r\n 'newspop': 997,\r\n 'relbert/lexical_relation_classification': 998,\r\n 'yahoo_answers_qa': 1003,\r\n 'emo': 1004,\r\n 'silicone': 1005,\r\n 'cord19': 1015,\r\n 'tweet_qa': 1018,\r\n 'meta_woz': 1019,\r\n 'md_gender_bias': 1021,\r\n 'art': 1031,\r\n 'google_wellformed_query': 1032,\r\n 'ambig_qa': 1033,\r\n 'taskmaster2': 1035,\r\n 'quac': 1042,\r\n 'freebase_qa': 1043,\r\n 'quora': 1044,\r\n 'numer_sense': 1045,\r\n 'narrativeqa': 1046,\r\n 'ccdv/pubmed-summarization': 1047,\r\n 'qa_zre': 1049,\r\n 'limit': 1050,\r\n 'tweets_hate_speech_detection': 1051,\r\n 'mocha': 1052,\r\n 'hatexplain': 1053,\r\n 'bing_coronavirus_query_set': 1054,\r\n 'great_code': 1055,\r\n 'medal': 1056,\r\n 'sent_comp': 1057,\r\n 'kelm': 1058,\r\n 'natural_questions': 1059,\r\n 'wiki_split': 1061,\r\n 'zest': 1062,\r\n 'cfq': 1063,\r\n 'multi_re_qa': 1071,\r\n 'stereoset': 1080,\r\n 'coqa': 1082,\r\n 'cuad': 1083,\r\n 'break_data': 1084,\r\n 'mbpp': 1089,\r\n 'knkarthick/dialogsum': 1091,\r\n 'wiki_auto': 1092,\r\n 'pile-of-law/pile-of-law': 1097,\r\n 'pg19': 1132,\r\n 'DFKI-SLT/few-nerd': 1133,\r\n 'wikicorpus': 1136,\r\n 'e2e_nlg': 1142,\r\n 'anton-l/superb': 1143,\r\n 'ghomasHudson/muld': 1144,\r\n 'Exr0n/wiki-entity-similarity': 1150,\r\n 'BeIR/nfcorpus': 1156,\r\n 'ccdv/govreport-summarization': 1158,\r\n 'woz_dialogue': 1159,\r\n 'reddit': 1164,\r\n 'EMBO/sd-nlp': 1165,\r\n 'empathetic_dialogues': 1170,\r\n 'BeIR/fiqa': 1171,\r\n 'generics_kb': 1173,\r\n 'swda': 1177,\r\n 'wikitablequestions': 1178,\r\n 'pubmed': 1183,\r\n 'chr_en': 1184,\r\n 'sharc': 1185,\r\n 'sharc_modified': 1186,\r\n 'BeIR/scifact': 1190,\r\n 'nell': 1192,\r\n 'patriziobellan/PET': 1196,\r\n 'EMBO/biolang': 1198,\r\n 'dynabench/qa': 1202,\r\n 'reddit_tifu': 1206,\r\n 'BeIR/scidocs': 1208,\r\n 'pec': 1210,\r\n 'tner/tweetner7': 1213,\r\n 'BeIR/arguana': 1214,\r\n 'multidoc2dial': 1216,\r\n 'taskmaster1': 1219,\r\n 'spider': 1221,\r\n 'adv_glue': 1222,\r\n 'allenai/mslr2022': 1228,\r\n 'conceptnet5': 1230,\r\n 'tyqiangz/multilingual-sentiments': 1233,\r\n 'newsqa': 1246,\r\n 'metashift': 1249,\r\n 'so_stacksample': 1250,\r\n 'doc2dial': 1253,\r\n 'search_qa': 1256,\r\n 'yhavinga/mc4_nl_cleaned': 1258,\r\n 'hope_edi': 1270,\r\n 'proto_qa': 1273,\r\n 'tuple_ie': 1276,\r\n 'simple_questions_v2': 1279,\r\n 'nlpaueb/finer-139': 1282,\r\n 'bookcorpusopen': 1283,\r\n 'tner/ontonotes5': 1284,\r\n 'crd3': 1285,\r\n 'ucberkeley-dlab/measuring-hate-speech': 1286,\r\n 'gap': 1287,\r\n 'recipe_nlg': 1288,\r\n 'schema_guided_dstc8': 1289,\r\n 'BeIR/beir': 1291,\r\n 'sagnikrayc/mctest': 1294,\r\n 'eurlex': 1296,\r\n 'corypaik/coda': 1297,\r\n 'bc2gm_corpus': 1298,\r\n 'ascent_kb': 1299,\r\n 'curiosity_dialogs': 1301,\r\n 'covid_qa_deepset': 1302,\r\n 'air_dialogue': 1303,\r\n 'taskmaster3': 1305,\r\n 'xsum_factuality': 1306,\r\n 'medical_dialog': 1308,\r\n 'BeIR/trec-covid': 1312,\r\n 'lhoestq/test': 1314,\r\n 'newsroom': 1315,\r\n 'tne': 1316,\r\n 'covid_qa_ucsd': 1317,\r\n 'fhamborg/news_sentiment_newsmtsc': 1319,\r\n 'prachathai67k': 1321,\r\n 'cardiffnlp/tweet_topic_multi': 1322,\r\n 'datacommons_factcheck': 1323,\r\n 'deal_or_no_dialog': 1325,\r\n 'ubuntu_dialogs_corpus': 1327,\r\n 'eu_regulatory_ir': 1329,\r\n 'scifact': 1331,\r\n 'wi_locness': 1333,\r\n 'relbert/relation_mapping': 1335,\r\n 'coastalcph/fairlex': 1336,\r\n 'asnq': 1340,\r\n 'peer_read': 1341,\r\n 'metaeval/linguisticprobing': 1343,\r\n 'jigsaw_unintended_bias': 1353,\r\n 'totto': 1354,\r\n 'irc_disentangle': 1355,\r\n 'med_hop': 1357,\r\n 'numeric_fused_head': 1359,\r\n 'ollie': 1361,\r\n 'per_sent': 1363,\r\n 'SocialGrep/ten-million-reddit-answers': 1364,\r\n 'lmqg/qg_squad': 1366,\r\n 's2orc': 1367,\r\n 'Hellisotherpeople/DebateSum': 1368,\r\n 'SocialGrep/reddit-crypto-aug-2021': 1369,\r\n 'jigsaw_toxicity_pred': 1371,\r\n 'GroNLP/ik-nlp-22_slp': 1372,\r\n 'SocialGrep/reddit-nonewnormal-complete': 1374,\r\n 'SocialGrep/reddit-wallstreetbets-aug-2021': 1376,\r\n 'SocialGrep/the-reddit-covid-dataset': 1378,\r\n 'SocialGrep/top-american-universities-on-reddit': 1380,\r\n 'BeIR/beir-corpus': 1382,\r\n 'SocialGrep/one-year-of-r-india': 1384,\r\n 'BritishLibraryLabs/EThOS-PhD-metadata': 1386,\r\n 'librispeech_lm': 1388,\r\n 'few_rel': 1389,\r\n 'arxiv_dataset': 1390,\r\n 'lc_quad': 1391,\r\n 'diplomacy_detection': 1392,\r\n 'lmqg/qa_squadshifts_pseudo': 1393,\r\n 'grail_qa': 1461,\r\n 'tner/wnut2017': 1462,\r\n 'demo-org/auditor_review': 1463,\r\n 'allenai/real-toxicity-prompts': 1464,\r\n 'BeIR/nfcorpus-qrels': 1465,\r\n 'onestop_qa': 1466,\r\n 'demelin/moral_stories': 1467,\r\n 'atomic': 1493,\r\n 'crawl_domain': 1494,\r\n 'BeIR/quora': 1495,\r\n 'Abirate/english_quotes': 1497,\r\n 'narrativeqa_manual': 1498,\r\n 'BeIR/fiqa-qrels': 1499,\r\n 'social_bias_frames': 1500,\r\n 'pkavumba/balanced-copa': 1501,\r\n 'eraser_multi_rc': 1502,\r\n 'sled-umich/TRIP': 1503,\r\n 'opinosis': 1504,\r\n 'PiC/phrase_sense_disambiguation': 1505,\r\n 'enwik8': 1506,\r\n 'sem_eval_2020_task_11': 1508,\r\n 'gooaq': 1509,\r\n 'linnaeus': 1510,\r\n 'hover': 1511,\r\n 'GonzaloA/fake_news': 1512,\r\n 'consumer-finance-complaints': 1513,\r\n 'ohsumed': 1514,\r\n 'casino': 1515,\r\n 'gfissore/arxiv-abstracts-2021': 1516,\r\n 'conv_questions': 1517,\r\n 'hate_offensive': 1518,\r\n 'sofc_materials_articles': 1519,\r\n 'wanyu/IteraTeR_human_sent': 1520,\r\n 'dialog_re': 1521,\r\n 'fake_news_english': 1522,\r\n 'dart': 1523,\r\n 'blog_authorship_corpus': 1524,\r\n 'msr_zhen_translation_parity': 1525,\r\n 'cryptonite': 1526,\r\n 'disfl_qa': 1527,\r\n 'olm/olm-CC-MAIN-2022-21-sampling-ratio-0.14775510204': 1528,\r\n 'olm/olm-CC-MAIN-2022-33-sampling-ratio-0.20': 1529,\r\n 'coarse_discourse': 1530,\r\n 'eth_py150_open': 1531,\r\n 'event2Mind': 1532,\r\n 'Paul/hatecheck': 1533,\r\n 'eli5_category': 1534,\r\n 'hippocorpus': 1535,\r\n 'the_pile_books3': 1536,\r\n 'coached_conv_pref': 1537,\r\n 'has_part': 1538,\r\n 'times_of_india_news_headlines': 1539,\r\n 'medmcqa': 1540,\r\n 'Babelscape/rebel-dataset': 1541,\r\n 'glucose': 1542,\r\n 'msr_text_compression': 1543,\r\n 'msr_genomics_kbcomp': 1544,\r\n 'SpeedOfMagic/ontonotes_english': 1545,\r\n 'msr_sqa': 1546,\r\n 'wiki_movies': 1547,\r\n 'hybrid_qa': 1548,\r\n 'metooma': 1549,\r\n 'multi_nli_mismatch': 1550,\r\n 'text2log': 1551,\r\n 'the_pile_stack_exchange': 1552,\r\n 're_dial': 1553,\r\n 'inquisitive_qg': 1554,\r\n 'SocialGrep/one-million-reddit-jokes': 1555,\r\n 'time_dial': 1556,\r\n 'BeIR/scifact-qrels': 1557,\r\n 'sede': 1558,\r\n 'mutual_friends': 1559,\r\n 'pass': 1560,\r\n 'allenai/multi_lexsum': 1561,\r\n 'youtube_caption_corrections': 1562,\r\n 'NbAiLab/norec_agg': 1563,\r\n 'DanL/scientific-challenges-and-directions-dataset': 1564,\r\n 'SocialGrep/one-million-reddit-questions': 1565,\r\n 'Motahar/github-issues': 1566,\r\n 'SocialGrep/the-2022-trucker-strike-on-reddit': 1567,\r\n 'allenai/qasper': 1568,\r\n 'CyranoB/polarity': 1569,\r\n 'SocialGrep/one-million-reddit-confessions': 1570,\r\n 'debatelab/deepa2': 1571,\r\n 'bhavnicksm/sentihood': 1572,\r\n 'debatelab/aaac': 1573,\r\n 'jgammack/SAE-door-abstracts': 1574,\r\n 'erwanlc/cocktails_recipe': 1575,\r\n 'erwanlc/cocktails_recipe_no_brand': 1576,\r\n 'BeIR/arguana-qrels': 1577,\r\n 'tner/fin': 1578,\r\n 'BeIR/scidocs-qrels': 1579,\r\n 'tner/bc5cdr': 1580,\r\n 'olm/olm-CC-MAIN-2022-27-sampling-ratio-0.16142697881': 1581,\r\n 'BeIR/fever': 1582,\r\n 'cardiffnlp/tweet_topic_single': 1584,\r\n 'speechcolab/gigaspeech': 1585,\r\n 'BeIR/webis-touche2020': 1586,\r\n 'aquamuse': 1588,\r\n 'olm/olm-CC-MAIN-2022-40-sampling-ratio-0.15894621295': 1590,\r\n 'tner/btc': 1591,\r\n 'truthful_qa': 1592,\r\n 'McGill-NLP/FaithDial': 1594,\r\n 'ekinakyurek/ftrace': 1595,\r\n 'tomasg25/scientific_lay_summarisation': 1597,\r\n 'tner/mit_restaurant': 1599,\r\n 'bigscience-biomedical/bioasq_task_b': 1600,\r\n 'strombergnlp/broad_twitter_corpus': 1619,\r\n 'tner/bionlp2004': 1620,\r\n 'metaeval/recast': 1621,\r\n 'the_pile_openwebtext2': 1629,\r\n 'taln-ls2n/inspec': 1630,\r\n 'lmqg/qa_squadshifts': 1631,\r\n 'BeIR/hotpotqa': 1636,\r\n 'jpwahle/machine-paraphrase-dataset': 1638,\r\n 'tner/mit_movie_trivia': 1639,\r\n 'tner/conll2003': 1640,\r\n 'OxAISH-AL-LLM/wiki_toxic': 1641,\r\n 'ccdv/WCEP-10': 1642,\r\n 'BeIR/trec-covid-qrels': 1646,\r\n 'g8a9/europarl_en-it': 1647,\r\n 'carblacac/twitter-sentiment-analysis': 1648,\r\n 'usc-isi/WikiConvert': 1649,\r\n 'visual_genome': 1650,\r\n 'florianbussmann/FUNSD-vu2020revising': 1660,\r\n 'Felix-ML/quoteli3': 1661,\r\n 'allenai/scico': 1662,\r\n 'drAbreu/bc4chemd_ner': 1663,\r\n 'tner/tweebank_ner': 1664,\r\n 'alisawuffles/WANLI': 1665,\r\n 'Team-PIXEL/rendered-bookcorpus': 1666,\r\n 'Team-PIXEL/rendered-wikipedia-english': 1667,\r\n 'wanyu/IteraTeR_full_sent': 1668,\r\n 'EMBO/BLURB': 1669,\r\n 'metaeval/crowdflower': 1676,\r\n 'AlexaAI/bold': 1685,\r\n 'metaeval/ethics': 1686,\r\n 'sileod/movie_recommendation': 1691,\r\n 'lmqg/qg_subjqa': 1692,\r\n 'copenlu/scientific-exaggeration-detection': 1699,\r\n 'esb/datasets': 1700,\r\n 'BeIR/msmarco': 1701,\r\n 'biwi_kinect_head_pose': 1703,\r\n 'BeIR/quora-qrels': 1704,\r\n 'wardenga/lsoie': 1705,\r\n 'nlphuji/vasr': 1707,\r\n 'BeIR/nq': 1708,\r\n 'BeIR/dbpedia-entity': 1710,\r\n 'sadrasabouri/ShahNegar': 1712,\r\n 'knkarthick/xsum': 1713,\r\n 'ColumbiaNLP/FLUTE': 1714,\r\n 'bigscience-biomedical/scitail': 1715,\r\n 'lmqg/qg_squadshifts': 1717,\r\n 'BeIR/climate-fever': 1722,\r\n 'PiC/phrase_retrieval': 1724,\r\n 'bdotloh/empathetic-dialogues-contexts': 1726,\r\n 'ccdv/mediasum': 1727,\r\n 'BeIR/msmarco-qrels': 1735,\r\n 'alexfabbri/answersumm': 1736,\r\n 'pszemraj/text2image-multi-prompt': 1737,\r\n 'shibing624/source_code': 1738,\r\n 'kensho/spgispeech': 1741,\r\n 'jamescalam/channel-metadata': 1742,\r\n 'EMBO/sd-nlp-non-tokenized': 1743,\r\n 'facebook/pmd': 1748,\r\n 'drt/kqa_pro': 1749,\r\n 'BeIR/fever-qrels': 1751,\r\n 'TheFusion21/PokemonCards': 1752,\r\n 'zeroshot/twitter-financial-news-sentiment': 1753,\r\n 'bigscience-biomedical/blurb': 1754,\r\n 'mteb/bucc-bitext-mining': 1759,\r\n 'pinecone/core-2020-05-10-deduplication': 1763,\r\n 'tals/vitaminc': 1764,\r\n 'BeIR/hotpotqa-qrels': 1765,\r\n 'gigant/ted_descriptions': 1766,\r\n 'jpwahle/autoencoder-paraphrase-dataset': 1767,\r\n 'beki/privy': 1768,\r\n 'Muennighoff/P3': 1770,\r\n 'jpwahle/dblp-discovery-dataset': 1771,\r\n 'taln-ls2n/kp20k': 1773,\r\n 'bigscience-biomedical/biosses': 1774,\r\n 'allenai/prosocial-dialog': 1776,\r\n 'pacovaldez/stackoverflow-questions': 1777,\r\n 'kasnerz/hitab': 1778,\r\n 'relbert/semeval2012_relational_similarity': 1779,\r\n 'sagnikrayc/snli-cf-kaushik': 1780,\r\n 'mwritescode/slither-audited-smart-contracts': 1781,\r\n 'BeIR/webis-touche2020-qrels': 1787,\r\n 'bigscience-biomedical/mednli': 1788,\r\n 'pinecone/movielens-recent-ratings': 1790,\r\n 'BeIR/dbpedia-entity-qrels': 1791,\r\n 'shanya/crd3': 1792,\r\n 'knkarthick/samsum': 1793,\r\n 'BeIR/climate-fever-qrels': 1794,\r\n 'BeIR/nq-qrels': 1795,\r\n 'sanchit-gandhi/librispeech_asr_dummy': 1796,\r\n 'taln-ls2n/semeval-2010-pre': 1797,\r\n 'Bingsu/openwebtext_20p': 1798,\r\n 'PolyAI/banking77': 1799,\r\n 'JulesBelveze/tldr_news': 1800,\r\n 'Freed-Wu/kodak': 1801,\r\n 'biglam/gutenberg-poetry-corpus': 1802,\r\n 'SocialGrep/reddit-r-bitcoin-data-for-jun-2022': 1803,\r\n 'taln-ls2n/kptimes': 1805,\r\n 'biglam/old_bailey_proceedings': 1806,\r\n 'launch/gov_report': 1807,\r\n 'knkarthick/AMI': 1810,\r\n 'voidful/NMSQA': 1811,\r\n 'DTU54DL/dmeo': 1812,\r\n 'FinanceInc/auditor_sentiment': 1813,\r\n 'jamescalam/unsplash-25k-photos': 1814,\r\n 'Tidrael/tsl_news': 1815,\r\n 'DTU54DL/common3k-train': 1816,\r\n 'okite97/news-data': 1817,\r\n 'lmqg/qa_squad': 1818,\r\n 'ConvLab/woz': 1819,\r\n 'ConvLab/camrest': 1820,\r\n 'ConvLab/metalwoz': 1821,\r\n 'kakaobrain/coyo-700m': 1822,\r\n 'taln-ls2n/kpbiomed': 1823,\r\n 'abhinavk/openpi_v2': 1826,\r\n 'mwong/fever-claim-related': 1831,\r\n 'ConvLab/tm1': 1832,\r\n 'joey234/nan-nli': 1833,\r\n 'ConvLab/tm2': 1834,\r\n 'ConvLab/tm3': 1835,\r\n 'ConvLab/kvret': 1836,\r\n 'ConvLab/sgd': 1837,\r\n 'relbert/semeval2012_relational_similarity_v5': 1838,\r\n 'cmudrc/wave-energy': 1839,\r\n 'llangnickel/long-covid-classification-data': 1840,\r\n 'webis/args_me': 1841,\r\n 'HuggingFaceM4/something_something_v2': 1844,\r\n 'ConvLab/dailydialog': 1845,\r\n 'huanggab/reddit_haiku': 1846,\r\n 'relbert/semeval2012_relational_similarity_v6': 1847,\r\n 'pszemraj/riddlesense_plusplus': 1848,\r\n 'rungalileo/20_Newsgroups_Fixed': 1849,\r\n 'DTU54DL/common-voice-test16k': 1850,\r\n 'lhoestq/custom_squad': 1851,\r\n 'merve/poetry': 1852,\r\n 'yoshitomo-matsubara/srsd-feynman_easy': 1853,\r\n 'nightingal3/fig-qa': 1854,\r\n 'matejklemen/vuamc': 1855,\r\n 'strombergnlp/twitter_pos': 1856,\r\n 'nlphuji/winogavil': 1858,\r\n 'DFKI-SLT/tacred': 1859,\r\n 'valurank/News_Articles_Categorization': 1861,\r\n 'nbroad/mediasum': 1862,\r\n 'asapp/slue': 1863,\r\n 'zbnsl/emoteModified': 1865,\r\n 'adsabs/WIESP2022-NER': 1866,\r\n 'arize-ai/ecommerce_reviews_with_language_drift': 1867,\r\n 'UCL-DARK/ludwig': 1868,\r\n 'Aunsiels/InfantBooks': 1874,\r\n 'openclimatefix/uk_pv': 1875,\r\n 'copenlu/fever_gold_evidence': 1876,\r\n 'rungalileo/mit_movies_fixed_connll_format': 1877,\r\n 'jamescalam/youtube-transcriptions': 1878,\r\n 'lmqg/qa_harvesting_from_wikipedia': 1879,\r\n 'qanastek/Biosses-BLUE': 1880,\r\n 'zeronix1020/Strawberry-Disease': 1881,\r\n 'dferndz/cSQuAD2': 1882,\r\n 'taln-ls2n/pubmed': 1883,\r\n 'BeIR/scidocs-generated-queries': 1884,\r\n 'jmhessel/newyorker_caption_contest': 1885,\r\n 'inverse-scaling/NeQA': 1915,\r\n 'DTU54DL/common-voice': 1916,\r\n 'turingbench/TuringBench': 1917,\r\n 'demelin/understanding_fables': 1937,\r\n 'RUCAIBox/Open-Dialogue': 1938,\r\n 'allenai/multinews_sparse_max': 1939,\r\n 'RamAnanth1/lex-fridman-podcasts': 1940,\r\n 'sled-umich/Conversation-Entailment': 1941,\r\n 'stevhliu/demo': 1942,\r\n 'svakulenk0/qrecc': 1943,\r\n 'arize-ai/movie_reviews_with_context_drift': 1944,\r\n 'launch/ampere': 1945,\r\n 'AnonymousSub/recipe_RL_data_roberta-base': 1946,\r\n 'dreamproit/bill_summary_us': 1947,\r\n 'bgstud/libri-whisper-raw': 1948,\r\n 'jpwahle/etpc': 1949,\r\n 'DTU54DL/common-native-proc': 1950,\r\n 'mbartolo/synQA': 1951,\r\n 'wanyu/IteraTeR_full_doc': 1952,\r\n 'wanyu/IteraTeR_human_doc': 1953,\r\n 'orieg/elsevier-oa-cc-by': 1954,\r\n 'climatebert/environmental_claims': 1955,\r\n 'SocialGrep/the-reddit-climate-change-dataset': 1956,\r\n 'KGraph/FB15k-237': 1958,\r\n 'KheemDH/data': 1959,\r\n 'mwong/fever-evidence-related': 1960,\r\n 'HuggingFaceM4/TGIF': 1961,\r\n 'BeIR/fever-generated-queries': 1962,\r\n 'nateraw/ade20k-tiny': 1963,\r\n 'BeIR/cqadupstack-qrels': 1964,\r\n 'knkarthick/highlightsum': 1965,\r\n 'RUCAIBox/Data-to-text-Generation': 1966,\r\n 'GateNLP/broad_twitter_corpus': 1967,\r\n 'Tidrael/finance-headlines': 1968,\r\n 'lmqg/qag_squad': 1969,\r\n 'pacovaldez/stackoverflow-questions-2016': 1970,\r\n 'BeIR/fiqa-generated-queries': 1971,\r\n 'BeIR/signal1m-generated-queries': 1972,\r\n 'MicPie/unpredictable_msdn-microsoft-com': 1973,\r\n 'zeroshot/twitter-financial-news-topic': 1974,\r\n 'inverse-scaling/quote-repetition': 1975,\r\n 'esc-bench/esc-diagnostic-backup': 1976,\r\n 'lmqg/qg_annotation': 1977,\r\n 'sileod/wep-probes': 1978,\r\n 'DTU54DL/common-voice-test3k': 1981,\r\n 'jakartaresearch/causalqa': 1982,\r\n 'copenlu/sufficient_facts': 2002,\r\n 'ConvLab/multiwoz21': 2005,\r\n 'arka0821/multi_document_summarization': 2006,\r\n 'strombergnlp/rumoureval_2019': 2007,\r\n 'rongzhangibm/NaturalQuestionsV2': 2008,\r\n 'Muennighoff/mbpp': 2009,\r\n 'RUCAIBox/Simplification': 2011,\r\n 'shubhamg2208/lexicap': 2012,\r\n 'olm/olm-wikipedia-20220701': 2013,\r\n 'esc-bench/esc-diagnostic-dataset': 2014,\r\n 'jpwahle/autoregressive-paraphrase-dataset': 2015,\r\n 'GabrielVidal/dead-by-daylight-perks': 2016,\r\n 'DTU54DL/common-proc-whisper': 2017,\r\n 'valurank/PoliticalBias': 2018,\r\n 'McGill-NLP/TopiOCQA': 2019,\r\n 'gsarti/magpie': 2020,\r\n 'BeIR/cqadupstack-generated-queries': 2021,\r\n 'MicPie/unpredictable_mmo-champion-com': 2022,\r\n 'RUCAIBox/Question-Generation': 2023,\r\n 'allenai/multinews_sparse_mean': 2024,\r\n 'demo-org/diabetes': 2025,\r\n 'StonyBrookNLP/tellmewhy': 2026,\r\n 'bergr7/weakly_supervised_ag_news': 2027,\r\n 'din0s/msmarco-nlgen': 2028,\r\n 'frankier/cross_domain_reviews': 2029,\r\n 'gart-labor/pumpnli': 2030,\r\n 'AndyChiang/cloth': 2031,\r\n 'olm/olm-CC-MAIN-2017-22-sampling-ratio-0.16178770949': 2032,\r\n 'bgstud/libri': 2033,\r\n 'DTU54DL/commonvoice_accent_test': 2034,\r\n 'lewtun/my-awesome-dataset': 2035,\r\n 'peixian/rtGender': 2036,\r\n 'pmc/open_access': 2039,\r\n 'uva-irlab/trec-cast-2019-multi-turn': 2043,\r\n 'DFKI-SLT/scidtb': 2044,\r\n 'surrey-nlp/PLOD-filtered': 2045,\r\n 'wanyu/IteraTeR_v2': 2046,\r\n 'strombergnlp/ipm_nel': 2047,\r\n 'HuggingFaceM4/charades': 2048,\r\n 'ncats/EpiSet4NER-v2': 2050,\r\n 'HuggingFaceM4/ActivitiyNet_Captions': 2051,\r\n 'sileod/discourse_marker_qa': 2052,\r\n 'yoshitomo-matsubara/srsd-feynman_medium': 2053,\r\n 'BeIR/nfcorpus-generated-queries': 2054,\r\n 'BeIR/trec-news-generated-queries': 2055,\r\n 'BeIR/robust04-generated-queries': 2056,\r\n 'BeIR/quora-generated-queries': 2057,\r\n 'valurank/Adult-content-dataset': 2058,\r\n 'launch/open_question_type': 2059,\r\n 'knkarthick/topicsum': 2060,\r\n 'yuningm/citesum': 2061,\r\n 'elihoole/asrs-aviation-reports': 2062,\r\n 'DeveloperOats/DBPedia_Classes': 2063,\r\n 'hoskinson-center/proof-pile': 2064,\r\n 'RUCAIBox/Summarization': 2065,\r\n 'RUCAIBox/Question-Answering': 2066,\r\n 'RUCAIBox/Story-Generation': 2067,\r\n 'RUCAIBox/Paraphrase': 2068,\r\n 'jakartaresearch/semeval-absa': 2069,\r\n 'tner/ttc_dummy': 2071,\r\n 'copenlu/citeworth': 2072,\r\n 'allenai/multinews_sparse_oracle': 2073,\r\n 'allenai/multixscience_sparse_oracle': 2074,\r\n 'allenai/multixscience_sparse_mean': 2075,\r\n 'allenai/multixscience_sparse_max': 2076,\r\n 'allenai/ms2_sparse_oracle': 2077,\r\n 'mschi/blogspot_raw': 2078,\r\n 'gaurikapse/civis-consultation-summaries': 2079,\r\n 'chenghao/cuad_qa': 2080,\r\n 'esc-bench/esc-datasets': 2081,\r\n 'olm/olm-wikipedia-20221001': 2082,\r\n 'allenai/wcep_dense_oracle': 2083,\r\n 'dennlinger/wiki-paragraphs': 2084,\r\n 'AndyChiang/dgen': 2085,\r\n 'esb/diagnostic-dataset': 2086,\r\n 'havens2/naacl2022': 2087,\r\n 'fkdosilovic/docee-event-classification': 2088,\r\n 'DTU54DL/demo-common-whisper': 2089,\r\n 'dferndz/cSQuAD1': 2090,\r\n 'jpcorb20/multidogo': 2091,\r\n 'julien-c/reactiongif': 2092,\r\n 'lara-martin/Scifi_TV_Shows': 2093,\r\n 'lukesjordan/worldbank-project-documents': 2094,\r\n 'mnemlaghi/widdd': 2095,\r\n 'mvarma/medwiki': 2096,\r\n 'nateraw/beans': 2098,\r\n 'nateraw/cats_vs_dogs': 2099,\r\n 'nateraw/food101': 2100,\r\n 'nateraw/sync_food101': 2101,\r\n 'ncats/EpiSet4BinaryClassification': 2102,\r\n 'ncats/EpiSet4NER-v1': 2103,\r\n 'peixian/equity_evaluation_corpus': 2104,\r\n 'rajeshradhakrishnan/malayalam_wiki': 2105,\r\n 'softcatala/open-source-english-catalan-corpus': 2106,\r\n 'toloka/CrowdSpeech': 2107,\r\n 'valurank/12-factor': 2108,\r\n 'valurank/PoliticalBias_AllSides_Txt': 2109,\r\n 'valurank/PoliticalBias_Sources': 2110,\r\n 'valurank/hate-multi': 2111,\r\n 'valurank/news-12factor': 2112,\r\n 'valurank/offensive-multi': 2113,\r\n 'webimmunization/COVID-19-vaccine-attitude-tweets': 2114,\r\n 'wpicard/nostradamus-propheties': 2115,\r\n 'yuanchuan/annotated_reference_strings': 2116,\r\n 'ruanchaves/stan_large': 2117,\r\n 'ruanchaves/stan_small': 2118,\r\n 'ruanchaves/boun': 2119,\r\n 'ruanchaves/dev_stanford': 2120,\r\n 'ruanchaves/test_stanford': 2121,\r\n 'ruanchaves/snap': 2122,\r\n 'z-uo/qasper-squad': 2123,\r\n 'SocialGrep/the-antiwork-subreddit-dataset': 2124,\r\n 'CLUTRR/v1': 2126,\r\n 'malteos/test2': 2132,\r\n 'TomTBT/pmc_open_access_xml': 2133,\r\n 'SocialGrep/the-reddit-dataset-dataset': 2137,\r\n 'SocialGrep/the-reddit-place-dataset': 2139,\r\n 'projecte-aina/gencata': 2141,\r\n 'mwong/climate-evidence-related': 2142,\r\n 'mwong/climate-claim-related': 2143,\r\n 'surrey-nlp/PLOD-unfiltered': 2144,\r\n 'SocialGrep/the-reddit-irl-dataset': 2145,\r\n 'Lexi/spanextract': 2147,\r\n 'mwong/climatetext-claim-related-evaluation': 2148,\r\n 'mwong/climatetext-evidence-related-evaluation': 2149,\r\n 'ylacombe/xsum_factuality': 2150,\r\n 'mwong/climatetext-climate_evidence-claim-related-evaluation': 2151,\r\n 'mwong/climatetext-claim-climate_evidence-related-evaluation': 2152,\r\n 'mwong/climatetext-evidence-claim-pair-related-evaluation': 2153,\r\n 'mwong/climatetext-claim-evidence-pair-related-evaluation': 2154,\r\n 'patrickvonplaten/librispeech_asr_self_contained': 2155,\r\n 'BritishLibraryLabs/web_archive_classification': 2158,\r\n 'albertxu/CrosswordQA': 2159,\r\n 'SocialGrep/the-reddit-nft-dataset': 2160,\r\n 'janck/bigscience-lama': 2162,\r\n 'strombergnlp/twitter_pos_vcb': 2163,\r\n 'Filippo/osdg_cd': 2164,\r\n 'Ukhushn/home-depot': 2165,\r\n 'pile-of-law/eoir_privacy': 2166,\r\n 'drAbreu/sd-nlp-2': 2168,\r\n 'Leyo/TGIF': 2173,\r\n 'strombergnlp/named_timexes': 2174,\r\n 'domenicrosati/TruthfulQA': 2175,\r\n 'Roh/ryanspeech': 2176,\r\n 'Leyo/ActivityNet_Captions': 2177,\r\n 'IsaacBot/SQuAD-single-sentence-QA': 2178,\r\n 'morteza/cogtext': 2179,\r\n 'wdc/products-2017': 2180,\r\n 'rajeshvarma/QA_on_SLA': 2196,\r\n 'statworx/haiku': 2197,\r\n 'rajistics/million-headlines': 2198,\r\n 'feyzaakyurek/BBNLI': 2199,\r\n 'launch/gov_report_qs': 2200,\r\n 'DFKI-SLT/wikitext_linked': 2202,\r\n 'dianalogan/Marketing-Budget-and-Actual-Sales-Dataset': 2204,\r\n 'mehnaazasad/arxiv-co-ga': 2205,\r\n 'JeremyAlain/123_test': 2206,\r\n 'BeIR/arguana-generated-queries': 2209,\r\n 'BeIR/climate-fever-generated-queries': 2210,\r\n 'BeIR/dbpedia-entity-generated-queries': 2211,\r\n 'wise-east/spolin': 2212,\r\n 'yoshitomo-matsubara/srsd-feynman_hard': 2213,\r\n 'florentgbelidji/edmunds-car-ratings': 2214,\r\n 'olivierdehaene/xkcd': 2215,\r\n 'rajistics/auditor_review': 2216,\r\n 'BeIR/scifact-generated-queries': 2217,\r\n 'BeIR/trec-covid-generated-queries': 2218,\r\n 'BeIR/webis-touche2020-generated-queries': 2219,\r\n 'BeIR/nq-generated-queries': 2220,\r\n 'BeIR/hotpotqa-generated-queries': 2221,\r\n 'BeIR/bioasq-generated-queries': 2222,\r\n 'icelab/ntrs_meta': 2223,\r\n 'iejMac/CLIP-Kinetics700': 2224,\r\n 'fever/feverous': 2225,\r\n 'Livingwithmachines/hmd-erwt-training': 2226,\r\n 'wkrl/cord': 2227,\r\n 'launch/reddit_qg': 2228,\r\n 'arize-ai/xtreme_en': 2229}\r\n\r\ndataset_rank['Anthropic/model-written-evals']=13\r\ndataset_rank['Anthropic/hh-rlhf']=14"
  },
  {
    "path": "src/tasksource/mtasks.py",
    "content": "from .preprocess import cat, get,name, regen, constant, Classification, TokenClassification, MultipleChoice\nfrom .metadata import udep_labels\nfrom datasets import get_dataset_config_names, ClassLabel, Dataset, DatasetDict, concatenate_datasets, Sequence\n\ndef all(dataset_name):\n    try:\n        config_name=get_dataset_config_names(dataset_name)\n    except Exception as e:\n        print(dataset_name,e)\n        config_name=None\n    return dict(dataset_name=dataset_name, config_name=config_name)\n\ndef concatenate_configs(dataset):\n    return DatasetDict(train=concatenate_datasets(list(dataset.values())))\n\n# english tasks (few, to keep balance between languages)\n\nmoritz_xnli = Classification(\"premise\",\"hypothesis\",name(\"label\",[\"entailment\", \"neutral\",\"contradiction\"]), \n    pre_process=concatenate_configs, \n    dataset_name=\"MoritzLaurer/multilingual-NLI-26lang-2mil7\")\n\nxnli = Classification(\"premise\", \"hypothesis\", \"label\", **all(\"metaeval/xnli\"))\n\namericas_nli = Classification(\"premise\",\"hypothesis\",\"label\",config_name=\"all_languages\")\n\nstsb_multi_mt = Classification(\"sentence1\", \"sentence2\",\n    lambda x: float(x[\"similarity_score\"]/5),\n    **all('stsb_multi_mt'))\n\npawsx = Classification(\"sentence1\",\"sentence2\",name('label',['not_paraphrase','paraphrase']), **all('paws-x'))\n\nmiam = Classification(\"Utterance\",labels=\"Label\", **all('miam'))\n\nxstance = Classification(\"question\", \"comment\", \"label\",\n    **all(\"strombergnlp/x-stance\"))\n\n\noffenseval = Classification(lambda x: str(x[\"text\"]), labels=name(\"subtask_a\",['not offensive','offensive']),\n    pre_process=lambda ds:ds.filter(lambda x:  x['subtask_a'] in [0,1]),\n    dataset_name='strombergnlp/offenseval_2020',\n    config_name=[\"ar\",\"da\",\"gr\",\"tr\"])\n\noffenseval_dravidian = Classification(\"text\",labels=\"label\",config_name=['kannada','malayalam','tamil'])\n\nmlma_hate = Classification(\"tweet\", labels=lambda x:x[\"sentiment\"].split('_'),\n    dataset_name=\"nedjmaou/MLMA_hate_speech\")\n\nqam = Classification(\"question\",\"answer\",\"label\", dataset_name=\"xglue\",config_name=\"qam\")\n\n#x_sum_factuality = Classification(\"summary\",\"generated_summary\",\"label\", dataset_name=\"ylacombe/xsum_factuality\")\n\nx_fact = Classification('evidence','claim','label', dataset_name=\"metaeval/x-fact\")\n\nxglue___nc = Classification('news_body',labels='news_category')\nxglue___qadsm = Classification('query','ad_description','relevance_label')\nxglue___qam = Classification('question','answer','label')\nxglue___wpr = Classification('query','web_page_snippet','relavance_label') # relavance_label : sic\n\nxlwic = Classification(\n    sentence1=cat([\"target_word\",\"context_1\"], \" : \"),\n    sentence2=cat([\"target_word\",\"context_2\"], \" : \"),\n    labels='label',dataset_name=\"pasinit/xlwic\",config_name=['xlwic_de_de','xlwic_it_it','xlwic_fr_fr','xlwic_en_ko'])\n\n#[ \"spam\", \"fails_task\", \"lang_mismatch\", \"pii\", \"not_appropriate\", \"hate_speech\", \"sexual_content\", \"quality\", \"toxicity\", \"humor\", \"helpfulness\", \"creativity\", \"violence\" ]\n\noasst1__quality = Classification(\"parent_text\",\"text\",labels=\"quality\", dataset_name=\"tasksource/oasst1_dense_flat\",\n    pre_process = lambda ds:ds.remove_columns('labels'))\noasst1__toxicity = Classification(\"parent_text\",\"text\",labels=\"toxicity\", dataset_name=\"tasksource/oasst1_dense_flat\",\n    pre_process = lambda ds:ds.remove_columns('labels'))\noasst1__helpfulness = Classification(\"parent_text\",\"text\",labels=\"helpfulness\", dataset_name=\"tasksource/oasst1_dense_flat\",\n    pre_process = lambda ds:ds.remove_columns('labels'))\n\n\nlanguage_identification = Classification(\"text\",labels=\"labels\", dataset_name=\"papluca/language-identification\")\nwili_2018_langid = Classification(\"sentence\",labels=\"label\",dataset_name=\"wili_2018\")\n\nexams = MultipleChoice(get.question.stem, choices_list=get.question.choices.text,\n    labels=lambda x:'ABCDE'.index(x['answerKey']),\n    dataset_name=\"exams\", config_name='multilingual',\n    pre_process=lambda ds:ds.filter(lambda x:  x['answerKey'] in \"ABCDE\"))\n\nxcsr = MultipleChoice(get.question.stem, choices_list=get.question.choices.text,\n    labels=lambda x:'ABCDE'.index(x['answerKey']),\n    **all('xcsr'))\n\nxcopa = MultipleChoice(\"premise\",choices=['choice1','choice2'],labels=\"label\",\n    **all('xcopa'))\n\n#xstory = MultipleChoice(constant(''),choices=[\"text_right_ending\",\"text_wrong_ending\"],labels=constant(0), **all(\"juletxara/xstory_cloze\"))\n\nxstory = MultipleChoice(lambda x: \"\\n\".join([x[f'input_sentence_{i}'] for i in range(1,5)]),\n    choices=[\"sentence_quiz1\",\"sentence_quiz2\"],labels=constant(0), **all(\"juletxara/xstory_cloze\"))\n\n\nxglue_ner = TokenClassification(\"words\",\"ner\", dataset_name=\"xglue\",config_name=\"ner\")\nxglue_pos = TokenClassification(\"words\",\"pos\", dataset_name=\"xglue\",config_name=\"pos\")\n\n#disrpt_23 = Classification(\"unit1_sent\", \"unit2_sent\", \"label\",**all(\"metaeval/disrpt\"))\n\nudep__pos = TokenClassification('tokens','upos', **all('universal_dependencies'))\n\ndef udep_post_process(ds):\n    return ds.cast_column('labels', Sequence(ClassLabel(names=udep_labels)))\n\n#udep__deprel = TokenClassification('tokens',lambda x:[udep_labels.index(a) for a in x['deprel']],\n#    **all('universal_dependencies'),post_process=udep_post_process)\n\noasst_rlhf = MultipleChoice(\"prompt\",choices=['chosen','rejected'],labels=constant(0),\n    dataset_name=\"tasksource/oasst1_pairwise_rlhf_reward\")\n\nsentiment = Classification(\"text\",labels=\"label\", dataset_name=\"tyqiangz/multilingual-sentiments\",config_name=\"all\",\n    pre_process=lambda ds:ds.filter(lambda x: \"amazon_reviews\" not in x['source']) )\ntweet_sentiment = Classification(\"text\", labels=\"label\", **all('cardiffnlp/tweet_sentiment_multilingual'))\nreview_sentiment = Classification(\"review_body\",labels=\"stars\", dataset_name=\"amazon_reviews_multi\",config_name=\"all_languages\")\nemotion = Classification(\"text\",labels=\"emotion\",dataset_name=\"metaeval/universal-joy\")\n# in mms\n\nmms_sentiment = Classification(\"text\",labels=\"label\",dataset_name='Brand24/mms')\n\nmapa_fine = TokenClassification(\"tokens\",\"coarse_grained\",dataset_name='joelito/mapa')\nmapa_corase = TokenClassification(\"tokens\",\"fine_grained\",dataset_name='joelito/mapa')\n\naces_ranking = MultipleChoice(\"source\",choices=['good-translation','incorrect-translation'],labels=constant(0), dataset_name='nikitam/ACES')\naces_phenomena = Classification('source','incorrect-translation','phenomena', dataset_name='nikitam/ACES')\n\namazon_intent = Classification(\"utt\",labels=\"intent\",**all('AmazonScience/massive'))\n#    dataset_name='glue',config_name=['ocnli','afqmc'])\n\ntidy_as2=Classification(\"Question\",\"Sentence\",\"Label\",dataset_name='tasksource/tydi-as2-balanced') \n\nmulticoner = TokenClassification(\"tokens\",\"ner_tags_index\", **all(\"MultiCoNER/multiconer_v2\"))\n\nmtop = Classification(\"question\",labels=\"intent\", dataset_name=\"tasksource/mtop\")\n\nmlabel_nli = Classification(\"premise\",\"hypothesis\",\"labels\",dataset_name=\"tasksource/multilingual-zero-shot-label-nli\")\n\n#wino_x\n# clue, klue, indic_glue\n# SMS_Spam_Multilingual_Collection_Dataset\n"
  },
  {
    "path": "src/tasksource/preprocess.py",
    "content": "from collections.abc import Iterable\nfrom dotwiz import DotWiz\nfrom dataclasses import dataclass\nfrom typing import Union\nimport itertools\nimport funcy as fc\nimport exrex \nimport magicattr \nimport numpy as np\nimport copy\nimport datasets\nimport time\n\nMAX_MC_OPTIONS = 4\n\ndef get_column_names(dataset):\n    cn = dataset.column_names\n    if type(cn)==dict:\n        return set(fc.flatten(cn.values()))\n    else:\n        return set(cn)\n\n\ndef sample_dataset(dataset,n=10000, n_eval=1000,seed=0):\n    for k in dataset:\n        n_k=(n if k=='train' else n_eval)\n        if n_k and len(dataset[k])>n_k:\n            dataset[k]=dataset[k].train_test_split(train_size=n_k,seed=seed)['train']\n    return dataset\n\nclass Preprocessing(DotWiz):\n    default_splits = ('train','validation','test')\n    _instances = []\n\n    def __post_init__(self):\n        Preprocessing._instances+=[self]\n\n    @staticmethod\n    def __map_to_target(x,fn=lambda x:None, target=None):\n        x[target]=fn(x)\n        return x\n        \n    def load(self):\n        return self(datasets.load_dataset(self.dataset_name,self.config_name))\n\n    def __call__(self,dataset, max_rows=None, max_rows_eval=None,seed=0):\n        dataset = self.pre_process(dataset)\n\n        # manage splits\n        for k,v in zip(self.default_splits, self.splits):\n            if v and k!=v:\n                dataset[k]=dataset[v]\n                del dataset[v]\n            if k in dataset and not v: # obfuscated label\n                del dataset[k]\n        dataset = fix_splits(dataset)\n\n        for k in list(dataset.keys()):\n            if k not in self.default_splits:\n                del dataset[k]\n        dataset = sample_dataset(dataset, max_rows, max_rows_eval,seed=seed)\n        \n        # field annotated with a string\n        substitutions = {v:k for k,v in self.to_dict().items()\n            if (k and k not in {'splits','dataset_name','config_name'} \n            and type(v)==str and k!=v)}\n\n        dataset=dataset.remove_columns([c for c in substitutions.values() if c in dataset['train'].features and c not in substitutions])\n        dataset=dataset.rename_columns(substitutions)\n\n        # field annotated with a function                                \n        for k in self.to_dict().keys():\n            v=getattr(self, k)\n            if callable(v) and k not in {\"post_process\",\"pre_process\",\"load\"}:\n                dataset=dataset.map(self.__map_to_target,\n                                    fn_kwargs={'fn':v,'target':k})\n\n        dataset=dataset.remove_columns(\n            get_column_names(dataset)-set(self.to_dict().keys()))\n        dataset = fix_labels(dataset)\n        dataset = fix_splits(dataset) # again: label mapping changed\n        dataset = self.post_process(dataset)\n        return dataset\n\n\n@dataclass\nclass cat(Preprocessing):\n    fields:Union[str,list]=None\n    separator:str=' '\n        \n    def __call__(self, example=None):\n        y=[np.char.array(example[f]) + sep \n                for f,sep in zip(self.fields[::-1],itertools.repeat(self.separator))]\n        y=list(sum(*y))\n        if len(y)==1:\n            y=y[0]\n        return y\n\n\ndef pretty(f):\n    class pretty_f(DotWiz):\n        def __init__(self,*args):\n            self.__f_arg = f(*args)\n            for a in args:\n                setattr(self,'value',a)\n                \n        def __call__(self, *args,**kwargs):\n            return self.__f_arg(*args,**kwargs)\n\n        def __repr__(self):\n            return f\"{self.__f_arg.__qualname__ .split('.')[0]}({self.value})\"\n    return pretty_f\n\nclass dotgetter:\n    def __init__(self, path=''):\n        self.path=path\n\n    def __bool__(self):\n        return bool(self.path)\n\n    def __getattr__(self, k):\n        return self.__class__(f'{self.path}.{k}'.lstrip('.'))\n    \n    def __getitem__(self, i):\n        return self.__class__(f'{self.path}[{i}]')\n\n    def __call__(self, example=None):\n        return magicattr.get(DotWiz(example), self.path)\n\n    def __hash__(self):\n        return hash(self.path)\n\n\n@dataclass\nclass ClassificationFields(Preprocessing):\n    sentence1:str='sentence1'\n    sentence2:str='sentence2'\n    labels:str='labels'\n\n@dataclass\nclass Seq2SeqLMFields(Preprocessing):\n    prompt:str='prompt'\n    output:str='output'\n\n@dataclass\nclass TokenClassificationFields(Preprocessing):\n    tokens:str='tokens'\n    labels:str='labels'\n        \n@dataclass\nclass MultipleChoiceFields(Preprocessing):\n    inputs:str='input'\n    choices:Iterable=tuple()\n    labels:str='labels'\n    choices_list:str=None\n    def __post_init__(self):\n        for i, c in enumerate(self.choices):\n            setattr(self,f'choice{i}',c)\n        delattr(self,'choices')\n        if not self.choices_list:\n            delattr(self,'choices_list')\n    \n    def __call__(self,dataset, *args, **kwargs):\n        dataset = super().__call__(dataset, *args, **kwargs)\n        if self.choices_list:\n            dataset = dataset.filter(lambda x: 1<len(x['choices_list']))\n            n_options = min([len(x) for k in dataset for x in dataset[k]['choices_list']])\n            n_options = min(MAX_MC_OPTIONS,n_options)\n            dataset = dataset.map(self.flatten_choice_list, fn_kwargs={'n_options':n_options})\n\n        else:\n            dataset = dataset.map(self.sample_choices, fn_kwargs={'n_options':MAX_MC_OPTIONS})\n        return dataset\n\n    @staticmethod\n    def flatten_choice_list(x, n_options=None):\n        n_neg = n_options-1 if n_options else None\n        choices = x['choices_list']\n        label=x['labels']\n        neg = choices[:label] + choices[label+1:]\n        pos = choices[label]\n        x['labels']=0\n        x['choices_list']=[pos]+neg[:n_neg]\n        for i,o in enumerate(x['choices_list']):\n            x[f'choice{i}']=o\n        del x['choices_list']\n        return x\n\n    @staticmethod\n    def sample_choices(x, n_options=None):\n        choices = [x[c] for c in x if 'choice' in c]\n        if not MAX_MC_OPTIONS or len(choices)<=n_options:\n            return x\n        n_neg = n_options-1 if n_options else None\n        label=x['labels']\n        neg = choices[:label] + choices[label+1:]\n        pos = choices[label]\n        x['labels']=0\n        choices_list=[pos]+neg[:n_neg]\n        for c in list(x):\n            if 'choice' in c:\n                del x[c]\n        for i,o in enumerate(choices_list):\n            x[f'choice{i}']=o\n        return x\n\n@dataclass\nclass SharedFields:\n    splits:list=Preprocessing.default_splits\n    dataset_name:str = None\n    config_name:str = None\n    pre_process: callable = fc.identity\n    post_process: callable = fc.identity\n    #language:str=\"en\"\n    \n\n@dataclass\nclass Classification(SharedFields, ClassificationFields): pass\n\n@dataclass\nclass MultipleChoice(SharedFields, MultipleChoiceFields): pass\n\n@dataclass\nclass TokenClassification(SharedFields, TokenClassificationFields): pass\n\n@dataclass\nclass Seq2SeqLM(SharedFields, Seq2SeqLMFields): pass\n\nget=dotgetter()\nconstant = pretty(fc.constantly)\nregen = lambda x: list(exrex.generate(x))\n\ndef name(label_name, classes):\n    return lambda x:classes[x[label_name]]\n\ndef fix_splits(dataset):\n\n    if len(dataset)==1 and \"train\" not in dataset:\n        k = list(dataset)[0]\n        dataset['train'] = copy.deepcopy(dataset[k])\n        del dataset[k]\n\n    if 'auxiliary_train' in dataset:\n        del dataset['auxiliary_train']\n    \n    if 'test' in dataset: # manage obfuscated labels\n        if 'labels' in dataset['test'].features:\n            if len(set(fc.flatten(dataset['test'].to_dict()['labels'])))==1:\n                del dataset['test']\n\n    if 'validation' in dataset and 'train' not in dataset:\n        train_validation = dataset['validation'].train_test_split(0.5, seed=0)\n        dataset['train'] = train_validation['train']\n        dataset['validation']=train_validation['test']\n    \n    if 'validation' in dataset and 'test' not in dataset:\n        validation_test = dataset['validation'].train_test_split(0.5, seed=0)\n        dataset['validation'] = validation_test['train']\n        dataset['test']=validation_test['test']\n\n    if 'train' in dataset and 'validation' not in dataset:\n        train_val = dataset['train'].train_test_split(train_size=0.90, seed=0)\n        dataset['train'] = train_val['train']\n        dataset['validation']=train_val['test']\n\n    if 'test' in dataset and 'validation' not in dataset:\n        validation_test = dataset['test'].train_test_split(0.5, seed=0)\n        dataset['validation'] = validation_test['train']\n        dataset['test']=validation_test['test']\n\n    if 'validation' not in dataset and 'test' not in dataset:\n        train_val_test = dataset[\"train\"].train_test_split(train_size=0.90, seed=0)\n        val_test = train_val_test[\"test\"].train_test_split(0.5, seed=0)\n        dataset[\"train\"] = train_val_test[\"train\"]\n        dataset[\"validation\"] = val_test[\"train\"]\n        dataset[\"test\"] = val_test[\"test\"]\n        \n    return dataset \n\ndef fix_labels(dataset, label_key='labels'):\n    if type(dataset['train'][label_key][0]) in [int,list,float]:\n        return dataset\n    labels=set(fc.flatten(dataset[k][label_key] for k in {\"train\"}))\n    if set(labels)=={'entailment','neutral','contradiction'}:\n        order=lambda x:dict(fc.flip(enumerate(['entailment','neutral','contradiction']))).get(x,x)\n    else:\n        order=str\n    labels=sorted(labels, key=order)\n    dataset=dataset.cast_column(label_key, datasets.ClassLabel(names=labels))\n    return dataset\n\ndef concatenate_dataset_dict(l):\n    \"\"\"Concatenate a list of DatastDict objects sharing same splits and columns.\"\"\"\n    keys=l[0].keys()\n    return datasets.DatasetDict({k: datasets.concatenate_datasets([x[k] for x in l]) for k in keys})"
  },
  {
    "path": "src/tasksource/recast.py",
    "content": "import random\nfrom datasets import DatasetDict, Dataset\nfrom sorcery import dict_of\nimport string\n\nimproper_labels =['recast/recast_kg_relations','linguisticprobing',\"lex_glue/scotus\",'lexical_relation_classification/ROOT09',\"pragmeval/squinky\",\"pragmeval/emobank\",'pragmeval/persuasiveness']\nimproper_labels += ['glue/stsb', 'sick/relatedness', 'joci', 'utilitarianism', 'amazon_counterfactual/en', 'toxic_conversations', 'ethos/multilabel', 'lex_glue/eurlex', 'lex_glue/unfair_tos', 'app_reviews', 'humicroedit/subtask-1', 'stackoverflow-questions', 'go_emotions/simplified', 'google_wellformed_query', 'has_part', 'blog_authorship_corpus/age', 'promptCoherence', 'Sarcasm_News_Headline', 'auditor_review/demo-org--auditor_review', 'Dynasent_Disagreement', 'Politeness_Disagreement', 'SBIC_Disagreement', 'SChem_Disagreement', 'Dilemmas_Disagreement', 'sts-companion', 'acceptability-prediction', 'chaos-mnli-ambiguity', 'headline_cause/en_simple', 'oasst1_dense_flat', 'civil_comments']\n\nimproper_labels += ['stsb_multi_mt','MLMA_hate_speech','icl-symbol-tuning-instruct','zero-shot-label-nli']\n\nimproper_labels += ['essay-scoring','english-grading','HelpSteer','oasst2']\n\ndef render_options(options):\n    options = [f'\"{x}\"' for x in options]\n    return f\"{', '.join(options[:-1])} or {options[-1]}\"\n\ndef render_classification(text,options,answer):\n    example = 'text_A→text_B' if text.startswith('text_A:') else 'the following'\n    inputs = f'With no explanation, label {example} with either {render_options(options)}.\\n{text}'\n    targets = f\"{answer}.\"\n    return dict_of(inputs,targets)\n\ndef render_token_classification(tokens,options,labels):\n    prefix = f'With no explanation, label each line with {render_options(options)} preceded by \":\".\\n'\n    inputs = prefix+\"\\n\".join(tokens)\n    targets = \"\\n\".join([':'.join(x) for x in zip(tokens,labels)])\n    return dict_of(inputs,targets)\n\ndef render_multiple_choice(prompt, options, labels):\n    inputs=(prompt+'\\n' if prompt else '')\n    letters = string.ascii_uppercase[:len(options)]\n    inputs=f'With no explanation, chose the best option from {render_options(letters)}. {inputs}'    \n    for letter, option in zip(letters, options):\n        inputs+=f'\\n{letter}: {option}'\n    targets = f'{letters[labels]}.'\n    return dict_of(inputs, targets) \n\ndef negative_sample_options(y, labels,N=4):\n    if len(labels)<N:\n        return labels\n    else:\n        return [y]+random.sample([x for x in labels if x!=y], N-1)\n\ndef shuffle_choices(x):\n    choices = sorted([k for k in x if 'choice' in k])\n    choices_texts = [x[c] for c in choices]\n    correct_choice =choices_texts[x['labels']]\n    random.shuffle(choices_texts)\n    for c, ct in zip(choices, choices_texts):\n        x[c]=ct\n    x[\"labels\"]=choices_texts.index(correct_choice)\n    return x\n\ndef recast_dataset_classification_to_mc(dataset,sep=\"[SEP]\",N=4):\n\n    def recast_split(d,N=N):\n        labels = d.features['labels']\n        df=d.to_pandas()\n        df['inputs'] = df.sentence1\n        if \"sentence2\" in df:\n            df['inputs'] +=sep + df.sentence2\n\n        N=min(N, len(labels.names))\n        df['choices']=df.apply(lambda x:negative_sample_options(labels.int2str(x['labels']), labels.names,N),axis=1)     \n        df['labels']=df.apply(lambda x:x['choices'].index(labels.int2str(x['labels'])),axis=1)\n\n        for i in range(N):\n            df[f'choice{i}']= \"This example is \" + df.choices.map(lambda x:x[i])\n\n        choices = [f'choice{i}' for i in range(N)]\n        return Dataset.from_pandas(df[['inputs',*choices,'labels']],preserve_index=False)\n\n    return DatasetDict({k: recast_split(v) for k,v in dataset.items()})\n\n\ndef recast_instruct(dataset):\n    features = dataset['train'].features\n    labels = features['labels']\n\n    if \"sentence1\" in features:\n        task_type='Classification'\n    if \"choice0\" in features:\n        task_type = \"MultipleChoice\"\n    if \"tokens\" in features:\n        task_type = \"TokenClassification\"\n\n    def recast_MultipleChoice(x):\n        x=shuffle_choices(x)\n        choices = sorted([k for k in x if 'choice' in k])\n        if all([x[c] in x['inputs'] for c in choices]):\n            return {\"inputs\":x['inputs'], 'targets': x[f\"choice{x['labels']}\"].strip()+\".\"}\n        else:\n            return render_multiple_choice(x['inputs'],[x[c] for c in choices],x['labels'])\n\n    def recast_TokenClassification(x):\n        distractors = list(labels.feature.names)\n        x_labels = [labels.feature.int2str(y) for y in x['labels']]\n        labels_set= list({labels.feature.int2str(y) for y in x['labels']})\n        options=list(dict.fromkeys(labels_set+distractors))[:max(len(labels_set),10)]\n        return render_token_classification(x['tokens'],options,x_labels)\n\n    def recast_Classification(x):\n        if 'sentence2' in x:\n            text=f\"text_A: {x['sentence1']}\\ntext_B: {x['sentence2']}\"\n        else:\n            text=x['sentence1']\n            \n        answer=labels.int2str(x['labels']).strip()\n        options= negative_sample_options(answer, labels._int2str)\n        return render_classification(text, options, answer)\n        \n    dataset = dataset.map(eval(f\"recast_{task_type}\"))\n    dataset = dataset.remove_columns([k for k in features if k not in ['inputs','targets']])\n    return dataset\n "
  },
  {
    "path": "src/tasksource/tasks.py",
    "content": "from .preprocess import cat, get, regen, name, constant, Classification, TokenClassification, MultipleChoice\nfrom .metadata import bigbench_discriminative_english, blimp_hard, imppres_presupposition, imppres_implicature, udep_en_configs, udep_en_labels\nfrom datasets import get_dataset_config_names, Sequence, ClassLabel, Dataset, DatasetDict\n\n# variable name: dataset___config__task\n\n###################### NLI/paraphrase ###############################\n\nglue___mnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"train\", None, \"validation_matched\"])\nglue___qnli = Classification(\"question\",\"sentence\", labels=\"label\")\nglue___rte = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\nglue___wnli = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\n#glue___ax = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"test\", None, None]) # fully masked\n\nglue___mrpc = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\nglue___qqp = Classification(sentence1=\"question1\", sentence2=\"question2\", labels=\"label\")\nglue___stsb = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\")\n\nsuper_glue___boolq = Classification(sentence1=\"question\", labels=\"label\")\nsuper_glue___cb = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\")\nsuper_glue___multirc = Classification(\n    cat([\"paragraph\", \"question\"]),\n    'answer',\n    labels='label'\n)\n#super_glue___rte = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\") # in glue\nsuper_glue___wic = Classification(\n    sentence1=cat([\"word\",\"sentence1\"], \" : \"),\n    sentence2=cat([\"word\",\"sentence2\"], \" : \"),\n    labels='label'\n)\nsuper_glue___axg = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"test\", None, None])\n\n\nanli__a1 = Classification('premise','hypothesis','label', splits=['train_r1','dev_r1','test_r1'])\nanli__a2 = Classification('premise','hypothesis','label', splits=['train_r2','dev_r2','test_r2'])\nanli__a3 = Classification('premise','hypothesis','label', splits=['train_r3','dev_r3','test_r3'])\n\n\nbabi_nli = Classification(\"premise\", \"hypothesis\", \"label\",\n    dataset_name=\"tasksource/babi_nli\",\n    config_name=set(get_dataset_config_names(\"tasksource/babi_nli\"))-{\"agents-motivations\"}\n) # agents-motivations task is not as clear-cut as the others\n\n\nsick__label         = Classification('sentence_A','sentence_B','label')\nsick__relatedness   = Classification('sentence_A','sentence_B','relatedness_score')\nsick__entailment_AB = Classification('sentence_A','sentence_B','entailment_AB')\n#sick__entailment_BA = Classification('sentence_A','sentence_B','entailment_BA')\n\ndef remove_neg_1(dataset):\n    return dataset.filter(lambda x:x['labels']!=-1)\n\nsnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\",\n    post_process=remove_neg_1)\n\nscitail = Classification(\"sentence1\",\"sentence2\",\"gold_label\",config_name=\"snli_format\")\n\nhans = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\")\n\nwanli = Classification('premise','hypothesis','gold', dataset_name=\"alisawuffles/WANLI\")\n\nrecast_nli = Classification(sentence1=\"context\", sentence2=\"hypothesis\", labels=\"label\", dataset_name=\"tasksource/recast\",\n    config_name=['recast_kg_relations', 'recast_puns', 'recast_factuality', 'recast_verbnet',\n    'recast_verbcorner', 'recast_ner', 'recast_sentiment', 'recast_megaveridicality'])\n\n\nprobability_words_nli = Classification(sentence1=\"context\", sentence2=\"hypothesis\", labels=\"label\",\n    dataset_name=\"sileod/probability_words_nli\", \n    config_name=[\"reasoning_1hop\",\"reasoning_2hop\",\"usnli\"])\n\nnan_nli = Classification(\"premise\", \"hypothesis\", \"label\", dataset_name=\"joey234/nan-nli\")\n\nnli_fever = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/nli_fever\", splits=[\"train\",\"dev\",None])\n\nbreaking_nli = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"pietrolesci/breaking_nli\", splits=[\"full\",None,None])\n\nconj_nli = Classification(\"premise\",\"hypothesis\",\"label\",post_process=remove_neg_1,\n    dataset_name=\"pietrolesci/conj_nli\",splits=['train','dev',None])\n\nfracas = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/fracas\")\n\ndialogue_nli = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"pietrolesci/dialogue_nli\")   \n\nmpe_nli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/mpe\",\n    splits=[\"train\",\"dev\",\"test\"])  \n\ndnc_nli = Classification(\"context\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/dnc\")\n\n# gpt3_nli = Classification(\"text_a\",\"text_b\",\"label\",dataset_name=\"pietrolesci/gpt3_nli\") # not sound enough\n\nrecast_white__fnplus = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['fnplus',None,None])\nrecast_white__sprl = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['sprl',None,None])\nrecast_white__dpr = Classification(\"text\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/recast_white\",splits=['dpr',None,None])\n\njoci = Classification(\"context\",\"hypothesis\",\n    labels=lambda x: [None, \"impossible\", \"technically possible\", \"plausible\", \"likely\", \"very likely\"][x[\"original_label\"]],\n    pre_process=lambda ds:ds.filter(lambda x:x['original_label']!=0),\n    dataset_name=\"pietrolesci/joci\",splits=['full',None,None])\n\n#enfever_nli = Classification(\"evidence\",\"claim\",\"label\", dataset_name=\"ctu-aic/enfever_nli\")\n\nrobust_nli__IS_CS = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"IS_CS\",None,None])\nrobust_nli__LI_LI = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"LI_LI\",None,None])\nrobust_nli__ST_WO = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_WO\",None,None])\nrobust_nli__PI_SP = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"PI_SP\",None,None])\nrobust_nli__PI_CD = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"PI_CD\",None,None])\nrobust_nli__ST_SE = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_SE\",None,None])\nrobust_nli__ST_NE = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_NE\",None,None])\nrobust_nli__ST_LM = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/robust_nli\", splits=[\"ST_LM\",None,None])\nrobust_nli_is_sd = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/robust_nli_is_sd\")\nrobust_nli_li_ts = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/robust_nli_li_ts\")\n\ngen_debiased_nli__snli_seq_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_seq_z\",None,None])\ngen_debiased_nli__snli_z_aug = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_z_aug\",None,None])\ngen_debiased_nli__snli_par_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"snli_par_z\",None,None])\ngen_debiased_nli__mnli_par_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_par_z\",None,None])\ngen_debiased_nli__mnli_z_aug = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_z_aug\",None,None])\ngen_debiased_nli__mnli_seq_z = Classification(\"premise\",\"hypothesis\",\"label\",\n\tdataset_name=\"pietrolesci/gen_debiased_nli\", splits=[\"mnli_seq_z\",None,None])\n\nadd_one_rte = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"pietrolesci/add_one_rte\",splits=[\"train\",\"dev\",\"test\"])\n\ndef _imppres_post_process(ds,prefix=''):\n    # imppres entailment definition is either purely semantic or purely pragmatic\n    # because of that, we assign differentiate the labels from anli/mnli notation\n    return ds.cast_column('labels', ClassLabel(\n    names=[f'{prefix}_entailment',f'{prefix}_neutral',f'{prefix}_contradiction']))\n\nimppres__presupposition = imppres__prag = Classification(\"premise\",\"hypothesis\",\"gold_label\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_presupposition,\n    post_process=_imppres_post_process)\n\nimppres__prag = Classification(\"premise\",\"hypothesis\",\"gold_label_prag\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_implicature,\n    post_process=lambda x: _imppres_post_process(x,'pragmatic'))\n\nimppres__log = Classification(\"premise\",\"hypothesis\",\"gold_label_log\",\n    dataset_name=\"tasksource/imppres\", config_name=imppres_implicature,\n    post_process=lambda x: _imppres_post_process(x,'logical'))\n\n\n#glue__diagnostics = Classification(\"premise\",\"hypothesis\",\"label\",\n#    dataset_name=\"pietrolesci/glue_diagnostics\",splits=[\"test\",None,None])\n\nhlgd = Classification(\"headline_a\", \"headline_b\", labels=\"label\")\n\npaws___labeled_final   = Classification(\"sentence1\", \"sentence2\", name('label',['not_paraphrase','paraphrase']))\npaws___labeled_swap    = Classification(\"sentence1\", \"sentence2\", name('label',['not_paraphrase','paraphrase']), splits=[\"train\", None, None])\n#paws___unlabeled_final = Classification(\"sentence1\", \"sentence2\", \"label\")\n\n#quora = Classification(get.questions.text[0], get.questions.text[1], 'is_duplicate') # in glue\nmedical_questions_pairs = Classification(\"question_1\",\"question_2\", name(\"label\",['not similar','similar']))\n \n###################### Token Classification #########################\n\nconll2003__pos_tags   = TokenClassification(tokens=\"tokens\", labels='pos_tags')\nconll2003__chunk_tags = TokenClassification(tokens=\"tokens\", labels='chunk_tags')\nconll2003__ner_tags   = TokenClassification(tokens=\"tokens\", labels='ner_tags')\n\n#tner___tweebank_ner    = TokenClassification(tokens=\"tokens\", labels=\"tags\")\n\n######################## Multiple choice ###########################\n\n\nmodel_written_evals = MultipleChoice('question', choices=['answer_matching_behavior','answer_not_matching_behavior'], labels=constant(0),  \n    dataset_name=\"Anthropic/model-written-evals\")\n\ntruthful_qa___multiple_choice = MultipleChoice(\n    \"question\",\n    choices_list=get.mc1_targets.choices,\n    labels=constant(0)\n)\n\nfig_qa = MultipleChoice(\n    \"startphrase\",\n    choices=[\"ending1\",\"ending2\"],\n    labels=\"labels\",\n    dataset_name=\"nightingal3/fig-qa\",\n    splits=[\"train\",\"validation\",None]\n)\n\nbigbench = MultipleChoice(\n    'inputs',\n    choices_list='multiple_choice_targets',\n    labels=lambda x:x['multiple_choice_scores'].index(1) if 1 in ['multiple_choice_scores'] else -1,\n    dataset_name='tasksource/bigbench',\n    config_name=bigbench_discriminative_english - {\"social_i_qa\",\"intersect_geometry\"} # english multiple choice tasks, minus duplicates\n)\n#\"goal_step_wikihow\"\n\nblimp_hard = MultipleChoice(inputs=constant(''),\n    choices=['sentence_good','sentence_bad'],\n    labels=constant(0),\n    dataset_name=\"blimp\",\n    config_name=blimp_hard # tasks where GPT2 is at least 10% below  human accuracy\n)\n\ncos_e = MultipleChoice('question',\n    choices_list='choices',\n    labels= lambda x: x['choices_list'].index(x['answer']),\n    config_name='v1.0')\n\ncosmos_qa = MultipleChoice(cat(['context','question']),regen('answer[0-3]'),'label')\n\ndream = MultipleChoice(\n    lambda x:\"\\n\".join(x['dialogue']+[x['question']]),\n    choices_list='choice',\n    labels=lambda x:x['choices_list'].index(x['answer'])\n)\n\nopenbookqa = MultipleChoice(\n    'question_stem',\n    choices_list=get.choices.text,\n    labels='answerKey'\n)\n\nqasc = MultipleChoice(\n    'question',\n    choices_list=get.choices.text,\n    labels=lambda x: \"ABCDEFGH\".index(x['answerKey']),\n    splits=['train','validation',None]\n    \n)\n\nquartz = MultipleChoice(\n    'question',\n    choices_list=get.choices.text,\n    labels='answerKey'\n)\nquail = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',\n    labels='correct_answer_id' \n)\n\nhead_qa___en = MultipleChoice(\"qtext\",\n    choices_list = lambda x:[a['atext'] for a in x[\"answers\"]],\n    labels = lambda x:[a['aid'] for a in x[\"answers\"]].index(x[\"ra\"])\n)\n\n\nsciq = MultipleChoice(\n    'question',\n    ['correct_answer']+regen('distractor[1-3]'),\n    labels=constant(0))\n\nsocial_i_qa = MultipleChoice(\n    'question',\n    ['answerA','answerB','answerC'],\n    'label')\n\nwiki_hop___original = MultipleChoice(\n    'question', \n    choices_list='candidates',\n    labels=lambda x:x['choices_list'].index(x[\"answer\"]))\n\nwiqa = MultipleChoice('question_stem',\n    choices_list = lambda x: x['choices']['text'],\n    labels='answer_label_as_choice')\n\npiqa = MultipleChoice('goal', choices=['sol1','sol2'], labels='label')\n\nhellaswag = MultipleChoice('ctx_a',\n    choices_list=lambda x: [f'{x[\"ctx_b\"]}{e}' for e in x[\"endings\"]],\n    labels='label', splits=['train','validation',None])\n\nsuper_glue___copa = MultipleChoice('premise',['choice1','choice2'],'label')\n\nbalanced_copa = MultipleChoice('premise',['choice1','choice2'],'label',\n    dataset_name=\"pkavumba/balanced-copa\")\n\ne_care = MultipleChoice('premise',['choice1','choice2'],'label',\n    dataset_name=\"12ml/e-CARE\")\n\nart = MultipleChoice(cat(['hypothesis_1','hypothesis_2']),\n    ['observation_1','observation_2'],\n    labels=lambda x:x['label']-1,\n    splits=['train','validation',None]\n)\n\n\nmmlu = MultipleChoice('question',labels='answer',choices_list='choices',splits=['validation','dev','test'],\n    dataset_name=\"tasksource/mmlu\",\n    config_name=get_dataset_config_names(\"tasksource/mmlu\")\n)\n\nwinogrande = MultipleChoice('sentence',['option1','option2'],'answer',config_name='winogrande_xl',\n    splits=['train','validation',None])\n\ncodah = MultipleChoice('question_propmt',choices_list='candidate_answers',labels='correct_answer_idx',config_name='codah')\n\nai2_arc__challenge = MultipleChoice('question',\n    choices_list=get.choices.text,  \n    labels=lambda x: get.choices.label(x).index(x[\"answerKey\"]),\n    config_name=[\"ARC-Challenge\",\"ARC-Easy\"])\n\ndefinite_pronoun_resolution = MultipleChoice(\n    inputs=cat([\"sentence\",\"pronoun\"],' : '),\n    choices_list='candidates',\n    labels=\"label\",\n    splits=['train',None,'test'])\n\nswag___regular=MultipleChoice(cat([\"sent1\",\"sent2\"]),regen(\"ending[0-3]\"),\"label\")\n\ndef _split_choices(s):\n    import re\n    return [x.rstrip(', ') for x in re.split(r'[a-e] \\) (.*?)',s) if x.strip(', ')]\n\nmath_qa = MultipleChoice(\n    'Problem', \n    choices_list = lambda x: _split_choices(x['options']),\n    labels = lambda x:'abcde'.index(x['correct'])   \n)\n\n#aqua_rat___tokenized = MultipleChoice(\"question\",choices_list=\"options\",labels=lambda x:\"ABCDE\".index(x['correct'])) in math_qa\n\n\n######################## Classification (other) ########################\nglue___cola = Classification(sentence1=\"sentence\", labels=\"label\")\nglue___sst2 = Classification(sentence1=\"sentence\", labels=\"label\")\n\nutilitarianism = Classification(\"comparison\",labels=\"label\",\ndataset_name=\"metaeval/utilitarianism\")\n\namazon_counterfactual = Classification(\n    \"text\", labels=\"label\",\n    dataset_name=\"mteb/amazon_counterfactual\",\n    config_name=\"en\")\n\ninsincere_questions = Classification(\n    \"text\", labels=\"label_text\",\n    dataset_name=\"SetFit/insincere-questions\")\n\ntoxic_conversations = Classification(\n    \"text\", labels=\"label\",\n    dataset_name=\"SetFit/toxic_conversations\")\n\nturingbench = Classification(\"Generation\",labels=\"label\",\n    dataset_name=\"turingbench/TuringBench\",\n    splits=[\"train\",\"validation\",None])\n\n\ntrec = Classification(sentence1=\"text\", labels=\"fine_label\")\n\ntals_vitaminc = Classification('claim','evidence','label', dataset_name=\"tals/vitaminc\")\n\nhope_edi = Classification(\"text\", labels=\"label\", splits=[\"train\", \"validation\", None], config_name=[\"english\"])\n\n#fever___v1_0 = Classification(sentence1=\"claim\", labels=\"label\", splits=[\"train\", \"paper_dev\", \"paper_test\"], dataset_name=\"fever\", config_name=\"v1.0\")\n#fever___v2_0 = Classification(sentence1=\"claim\", labels=\"label\", splits=[None, \"validation\", None], dataset_name=\"fever\", config_name=\"v2.0\")\n\nrumoureval_2019 = Classification(\n    sentence1=\"source_text\",\n    sentence2=lambda x: str(x[\"reply_text\"]),\n    labels=\"label\", dataset_name=\"strombergnlp/rumoureval_2019\", config_name=\"RumourEval2019\",\n    post_process=lambda ds:ds.filter(lambda x:x['labels']!=None)    \n)\n\nethos___binary = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\nethos___multilabel = Classification(\n    'text',\n    labels=lambda x: [x[c] for c in\n    ['violence', 'gender', 'race', 'national_origin', 'disability', 'religion', 'sexual_orientation','directed_vs_generalized']\n    ],\n    splits=[\"train\", None, None]\n)\n\ntweet_eval = Classification(sentence1=\"text\", labels=\"label\",\n    config_name=[\"emoji\", \"emotion\", \"hate\", \"irony\", \"offensive\", \"sentiment\"])\n\ndef stance_kwargs(topic):\n    return {\n        \"sentence1\": constant(f'Topic: {topic}. \\n Opinion:\\n'), \n        \"sentence2\": \"text\", \n        \"labels\": \"label\", \n        \"config_name\": f\"stance_{topic.lower()}\",\n        \"dataset_name\": \"tweet_eval\"\n    }\n\ntweet_eval_abortion = Classification(**stance_kwargs(\"abortion\"))\ntweet_eval_atheism  = Classification(**stance_kwargs(\"atheism\"))\ntweet_eval_climate  = Classification(**stance_kwargs(\"climate\"))\ntweet_eval_feminist = Classification(**stance_kwargs(\"feminist\"))\ntweet_eval_hillary  = Classification(**stance_kwargs(\"Hillary\"))\n\n\ndiscovery = Classification(\"sentence1\", \"sentence2\", labels=\"label\", config_name=[\"discovery\"])\n\npragmeval_1 = Classification(\"sentence\",labels=\"label\",\n    dataset_name=\"pragmeval\",\n    config_name= [\"emobank-arousal\", \"emobank-dominance\", \"emobank-valence\", \"squinky-formality\", \"squinky-implicature\", \n    \"squinky-informativeness\",\"switchboard\",\"mrda\",\"verifiability\"])\n\npragmeval_2 = Classification(\"sentence1\",\"sentence2\",labels=\"label\",\n    dataset_name=\"pragmeval\",\n    config_name= [\"emergent\", \"gum\", \"pdtb\", \"persuasiveness-claimtype\", \n    \"persuasiveness-eloquence\", \"persuasiveness-premisetype\", \"persuasiveness-relevance\", \"persuasiveness-specificity\", \n    \"persuasiveness-strength\", \"sarcasm\",\"stac\"])\n\nsilicone = Classification(\"Utterance\",labels=\"Label\",\n    config_name=['dyda_da', 'dyda_e', 'iemocap', 'maptask', 'meld_e', 'meld_s', 'oasis', 'sem'] # +['swda', 'mrda'] # in pragmeval\n)\n\nlex_glue___eurlex = Classification(sentence1=\"text\", labels=\"labels\") \nlex_glue___scotus = Classification(sentence1=\"text\", labels=\"label\")\nlex_glue___ledgar = Classification(sentence1=\"text\", labels=\"label\")\nlex_glue___unfair_tos = Classification(sentence1=\"text\", labels=\"labels\")\nlex_glue___case_hold = MultipleChoice(\"context\", choices_list='endings', labels=\"label\")\n\nlanguage_identification = Classification(\"text\",labels=\"labels\", dataset_name=\"papluca/language-identification\")\n\n################ Automatically generated (verified)##########\n\nimdb = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nrotten_tomatoes = Classification(sentence1=\"text\", labels=\"label\")\n\nag_news = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nyelp_review_full = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"yelp_review_full\"])\n\nfinancial_phrasebank = Classification(sentence1=\"sentence\", labels=\"label\", splits=[\"train\", None, None],\n    config_name=[\"sentences_allagree\"])\n\npoem_sentiment = Classification(sentence1=\"verse_text\", labels=\"label\")\n\n#emotion = Classification(sentence1=\"text\", labels=\"label\") # file not found\n\ndbpedia_14 = Classification(sentence1=\"content\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"dbpedia_14\"])\n\namazon_polarity = Classification(sentence1=\"content\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"amazon_polarity\"])\n\napp_reviews = Classification(\"review\", labels=\"star\", splits=[\"train\", None, None])\n\n# multi_nli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"train\", \"validation_matched\", None]) #glue\n\nhate_speech18 = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\n\nsms_spam = Classification(sentence1=\"sms\", labels=\"label\", splits=[\"train\", None, None])\n\nhumicroedit___subtask_1 = Classification(\"original\", \"edit\", labels=\"meanGrade\", dataset_name=\"humicroedit\", config_name=\"subtask-1\")\nhumicroedit___subtask_2 = Classification(\n    sentence1=cat(['original1','edit1'],' : '),\n    sentence2=cat(['original2','edit2'],' : '),\n    labels=\"label\", dataset_name=\"humicroedit\", config_name=\"subtask-2\")\n\nsnips_built_in_intents = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, None])\n\nbanking77 = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"])\n\nhate_speech_offensive = Classification(sentence1=\"tweet\", labels=\"class\", splits=[\"train\", None, None])\n\nyahoo_answers_topics = Classification(\n    \"question_title\",\"question_content\",labels=\"topic\")\n\nstackoverflow_questions=Classification(\"title\",\"body\",labels=\"label\",\n    dataset_name=\"pacovaldez/stackoverflow-questions\")\n\n#hyperpartisan_news_detection___byarticle = Classification(sentence1=\"text\", labels=\"hyperpartisan\", splits=[\"train\", None, None]) # files too heavy\n#hyperpartisan_news_detection___bypublisher = Classification(sentence1=\"text\", labels=\"hyperpartisan\", splits=[\"train\",\"validation\", None]) # files too heavy\n\nhyperpartisan_news = Classification(\n    \"text\",\n    labels=lambda x: {'true':'hyperpartisan','false':'not_hyperpartisan'}.get(x[\"label\"]),\n    dataset_name=\"zapsdcn/hyperpartisan_news\")\n\nscierc = Classification(\"text\",labels=\"label\",dataset_name=\"zapsdcn/sciie\")\ncitation_intent = Classification(\"text\",labels=\"label\",dataset_name=\"zapsdcn/citation_intent\")\n\n#go_emotions___raw = Classification(sentence1=\"text\", splits=[\"train\", None, None])\ngo_emotions___simplified = Classification(sentence1=\"text\", labels=\"labels\")\n\n#boolq = Classification(sentence1=\"question\", splits=[\"train\", \"validation\", None]) # in superglue\n\n#ecthr_cases___alleged_violation_prediction = Classification(labels=\"labels\", dataset_name=\"ecthr_cases\", config_name=\"alleged-violation-prediction\")\n#ecthr_cases___violation_prediction = Classification(labels=\"labels\", dataset_name=\"ecthr_cases\", config_name=\"violation-prediction\")\n#   too long\n\nscicite = Classification(sentence1=\"string\", labels=\"label\",dataset_name=\"allenai/scicite\")\n\nliar = Classification(sentence1=\"statement\", labels=\"label\")\n\nrelbert_lexical_relation_classification = Classification(sentence1=\"head\", sentence2=\"tail\", labels=\"relation\",\n dataset_name=\"relbert/lexical_relation_classification\",\n config_name=[\"BLESS\",\"CogALexV\",\"EVALution\",\"K&H+N\",\"ROOT09\"])\n\n\nlinguisticprobing = Classification(\"sentence\", labels=\"label\", dataset_name=\"tasksource/linguisticprobing\", \n    config_name=['subj_number',\n                'obj_number',\n                'past_present',\n                'sentence_length',\n                'top_constituents',\n                'tree_depth',\n                'coordination_inversion',\n                'odd_man_out',\n                'bigram_shift']#+['word_content'] #too many labels \n)\n\ncrowdflower = Classification(\"text\", labels=\"label\",\n splits=[\"train\", None, None], dataset_name=\"tasksource/crowdflower\",\n config_name=['sentiment_nuclear_power',\n            'tweet_global_warming',\n            'airline-sentiment',\n            'corporate-messaging',\n            'economic-news',\n            'political-media-audience',\n            'political-media-bias',\n            'political-media-message',\n            'text_emotion']\n)\n\nethics___commonsense = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"commonsense\")\nethics___deontology = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"deontology\")\nethics___justice = Classification(sentence1=\"text\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"justice\")\nethics___virtue = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\", dataset_name=\"metaeval/ethics\", config_name=\"virtue\")\n\nemo = Classification(sentence1=\"text\", labels=\"label\", splits=[\"train\", None, \"test\"], config_name=[\"emo2019\"])\n\ngoogle_wellformed_query = Classification(sentence1=\"content\", labels=\"rating\")\n\ntweets_hate_speech_detection = Classification(sentence1=\"tweet\", labels=\"label\", splits=[\"train\", None, None])\n\n#adv_glue___adv_sst2 = Classification(sentence1=\"sentence\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_qqp = Classification(sentence1=\"question1\", sentence2=\"question2\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_mnli = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_mnli_mismatched = Classification(sentence1=\"premise\", sentence2=\"hypothesis\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_qnli = Classification(sentence1=\"question\", labels=\"label\", splits=[\"validation\", None, None])\n#adv_glue___adv_rte = Classification(sentence1=\"sentence1\", sentence2=\"sentence2\", labels=\"label\", splits=[\"validation\", None, None])\n\nhas_part = Classification(\"arg1\",\"arg2\", labels=\"score\", splits=[\"train\", None, None])\n\nwnut_17 = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"wnut_17\"])\n\nncbi_disease = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"ncbi_disease\"])\n\nacronym_identification = TokenClassification(labels=\"labels\", tokens=\"tokens\")\n\njnlpba = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", splits=[\"train\", \"validation\", None], config_name=[\"jnlpba\"])\n\n#species_800 = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", config_name=[\"species_800\"]) missing files\n\nSpeedOfMagic_ontonotes_english = TokenClassification(tokens=\"tokens\", labels=\"ner_tags\", dataset_name=\"SpeedOfMagic/ontonotes_english\", config_name=\"SpeedOfMagic--ontonotes_english\")\n\nblog_authorship_corpus__gender    = Classification(sentence1=\"text\",labels=\"gender\")\nblog_authorship_corpus__age       = Classification(sentence1=\"text\",labels=\"age\")\n#blog_authorship_corpus__horoscope = Classification(sentence1=\"text\",labels=\"horoscope\")\nblog_authorship_corpus__job       = Classification(sentence1=\"text\",labels=\"job\")\n\nlaunch_open_question_type = Classification(sentence1=\"question\", labels=\"resolve_type\", dataset_name=\"launch/open_question_type\")\n\nhealth_fact = Classification(sentence1=\"claim\", labels=\"label\",\n    pre_process = lambda ds:ds.filter(lambda x:x['label'] not in {-1})\n)\n\ncommonsense_qa = MultipleChoice(\n    \"question\",\n    choices_list=get.choices.text,\n    labels=lambda x: \"ABCDE\".index(x[\"answerKey\"]),\n    splits=[\"train\",\"validation\",None]\n)\nmc_taco = Classification(\n    lambda x: f'{x[\"sentence\"]} {x[\"question\"]} {x[\"answer\"]}',\n    labels=\"label\",\n    splits=[ \"validation\",None,\"test\"]\n)\n\nade_corpus_v2___Ade_corpus_v2_classification = Classification(\"text\",labels=\"label\")\n\ndiscosense = MultipleChoice(\"context\",choices=regen(\"option\\_[0-3]\"),labels=\"label\",\n    dataset_name=\"prajjwal1/discosense\")\n    \ncirca = Classification(\n    sentence1=cat([\"context\",\"question-X\"]),\n    sentence2=\"answer-Y\",\n    labels=\"goldstandard2\", post_process=remove_neg_1)\n\n#code_x_glue_cc_defect_detection = Classification(\"func\", labels=\"target\")\n\n#code_x_glue_cc_clone_detection_big_clone_bench = Classification(\"func1\", \"func2\", \"label\") # in bigbench + too heavy (100g)\n\n#code_x_glue_cc_code_refinement = MultipleChoice(\n#    constant(\"\"), choices=[\"buggy\",\"fixed\"], labels=constant(0),\n#    config_name=\"medium\")\n\n#effective_feedback_student_writing = Classification(\"discourse_text\", \n#labels=\"discourse_effectiveness\",dataset_name=\"YaHi/EffectiveFeedbackStudentWriting\")\n# discontinued /!\\\n\n#promptSentiment = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptSentiment\")\n#promptNLI = Classification(\"premise\",\"hypothesis\",labels=\"label\",dataset_name=\"Ericwang/promptNLI\")\n#promptSpoke = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptSpoke\")\n#promptProficiency = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptProficiency\")\n#promptGrammar = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptGrammar\")\n#promptCoherence = Classification(\"text\",labels=\"label\",dataset_name=\"Ericwang/promptCoherence\")\n\nphrase_similarity = Classification(\n    sentence1=cat([\"phrase1\",\"sentence1\"], \" : \"),\n    sentence2=cat([\"phrase2\",\"sentence2\"], \" : \"),\n    labels='label',\n    dataset_name=\"PiC/phrase_similarity\"\n)\n\nexaggeration_detection = Classification(\n    sentence1=\"press_release_conclusion\",\n    sentence2=\"abstract_conclusion\",\n    labels=\"exaggeration_label\", \n    dataset_name=\"copenlu/scientific-exaggeration-detection\"\n)\nquarel = Classification(\n    \"question\",\n    labels=lambda x: \"AB\"[x[\"answer_index\"]]\n)\n\nmwong_fever_evidence_related = Classification(sentence1=\"claim\", sentence2=\"evidence\", labels=name(\"labels\",['unrelated','related']),\n    splits=[\"train\", \"valid\", \"test\"], dataset_name=\"mwong/fever-evidence-related\")\n\nnumer_sense = Classification(\"sentence\",labels=\"target\",splits=[\"train\",None,None])\n\ndynasent__r1 = Classification(\"sentence\", labels=\"gold_label\", \n    dataset_name=\"dynabench/dynasent\", config_name=\"dynabench.dynasent.r1.all\")\ndynasent__r2 = Classification(\"sentence\", labels=\"gold_label\", \n    dataset_name=\"dynabench/dynasent\", config_name=\"dynabench.dynasent.r2.all\")\n\nsarcasm_news = Classification(\"headline\", labels=\"is_sarcastic\",\n    dataset_name=\"raquiba/Sarcasm_News_Headline\")\n\nsem_eval_2010_task_8 = Classification(\"sentence\",labels=\"relation\")\n\nauditor_review = Classification(sentence1=\"sentence\",\n    labels=name(\"label\",['negative','neutral','positive']),\n    dataset_name=\"demo-org/auditor_review\")\n\nmedmcqa = MultipleChoice(\"question\", choices=regen('op[a-d]'),labels='cop')\n\n\ndynasent_disagreement    = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Dynasent_Disagreement\")\npoliteness_disagreement  = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Politeness_Disagreement\")\nsbic_disagreement        = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/SBIC_Disagreement\")\nschem_disagreement       = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/SChem_Disagreement\")\ndilemmas_disagreement    = Classification(\"text\", labels=\"binary_disagreement\", dataset_name=\"RuyuanWan/Dilemmas_Disagreement\")\n\nlogiqa = MultipleChoice(\n    cat([\"context\",\"query\"]),\n    choices_list = 'options',\n    labels = \"correct_option\",\n    dataset_name=\"lucasmccabe/logiqa\"\n)\n\n#proto_qa = MultipleChoice(\n#    \"question\",\n#    choices_list=lambda x:x['answer-clusters']['answers'],\n#    labels=lambda x: x['answer-clusters']['count'].index(max(x['answer-clusters']['count'])),\n#    config_name='proto_qa'\n#)\n\nwiki_qa = Classification(\"question\",\"answer\", name(\"label\",['False','True']))\n\ncycic_classification = Classification(\"question\",labels=name(\"correct_answer\",['False','True']),\n    dataset_name = \"tasksource/cycic_classification\")\ncycic_mc = MultipleChoice(\"question\", choices=regen('answer\\_option[0-4]'), labels=\"correct_answer\",\n    dataset_name = \"tasksource/cycic_multiplechoice\")\n\n\ndef _preprocess_chatgpt_detection(ex):\n    import random\n    label=random.random()<0.5\n    ex['label']=int(label)\n    ex['answer']=[str(ex['human_answers'][0]),str(ex['chatgpt_answers'][0])][label]\n    return ex\n\n#chatgpt_detection = Classification(\"question\",\"answer\",\"label\",\n#    dataset_name = 'Hello-SimpleAI/HC3', config_name=\"all\",\n#    pre_process=lambda dataset:dataset.map(_preprocess_chatgpt_detection))\n\nsts_companion = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/sts-companion\")\n\ncommonsense_qa_2 = Classification(\"question\",labels=\"answer\",\n    dataset_name=\"tasksource/commonsense_qa_2.0\")\n\nling_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/lingnli\")\n\nmonotonicity_entailment = Classification(\"sentence1\", \"sentence2\", \"gold_label\",    \n    dataset_name=\"tasksource/monotonicity-entailment\")\n\narct = MultipleChoice(cat([\"reason\",\"claim\"]),choices=[\"warrant0\",\"warrant1\"],\n    labels=\"correctLabelW0orW1\", dataset_name=\"tasksource/arct\")\n\nscinli = Classification(\"sentence1\", \"sentence2\", labels=\"label\",\n    post_process=lambda x:x.shuffle(seed=0),\n    dataset_name=\"tasksource/scinli\")\n\nnaturallogic = Classification(\" sent1 \",\" sent2 \",\" new_label \",dataset_name=\"tasksource/naturallogic\")\n\nonestop_qa = MultipleChoice(cat([\"paragraph\",\"question\"]),choices_list=\"answers\",\n    labels=constant(0))\n\nmoral_stories = MultipleChoice(cat([\"situation\",\"intention\"]),\n    choices=['moral_action',\"immoral_action\"],labels=constant(0),\n    dataset_name=\"demelin/moral_stories\", config_name=\"full\")\n\nprost = MultipleChoice(cat([\"context\",\"ex_question\"]), choices=['A','B','C','D'],labels=\"label\",\n    dataset_name=\"corypaik/prost\")\n\ndyna_hate = Classification(\"text\",labels=\"label\",dataset_name=\"aps/dynahate\",splits=['train',None,None])\n\nsyntactic_augmentation_nli = Classification('sentence1',\"sentence2\",\"gold_label\",dataset_name=\"metaeval/syntactic-augmentation-nli\")\n\nautotnli = Classification(\"premises\", \"hypothesis\", \"label\", dataset_name=\"tasksource/autotnli\")\n#equate = Classification(\"sentence1\", \"sentence2\", \"gold_label\",dataset_name=\"metaeval/equate\")\n\nconqada = Classification(\"sentence1\",\"sentence2\",\"label\",dataset_name=\"lasha-nlp/CONDAQA\",\n    pre_process = lambda ds:ds.filter(lambda x:x['label'] in {\"DON'T KNOW\",\"YES\",\"NO\"})\n)\n\nwebgbpt_comparisons = MultipleChoice(get.question.full_text, choices=['answer_0','answer_1'],\n    labels=lambda x:int(x['score_1']>0),\n    dataset_name=\"openai/webgpt_comparisons\")\n\nsynthetic_instruct = MultipleChoice('prompt', choices=['chosen', 'rejected'],\n    labels=constant(0), dataset_name=\"Dahoas/synthetic-instruct-gptj-pairwise\")\n\nscruples = Classification(\"text\",labels=\"binarized_label\",dataset_name=\"metaeval/scruples\")\n\nwouldyourather = MultipleChoice(constant('Most people would rather:'), choices=['option_a','option_b'],\n    labels= lambda x: int(x['votes_a']<x['votes_b']),\n    dataset_name=\"metaeval/wouldyourather\")\n\n#attempto_nli = Classification(\"premise\",\"hypothesis\",\n#    lambda x:f'race-{x[\"race_label\"]}',\n#    dataset_name=\"sileod/attempto-nli\")\n\ndefeasible_nli = Classification(cat([\"Premise\",\"Hypothesis\"]),\"Update\",labels=\"UpdateType\",\n    dataset_name=\"metaeval/defeasible-nli\",config_name=['atomic', 'snli'])\n\n#defeasible_nli_social = Classification(cat([\"SocialChemROT\",\"Hypothesis\"]),\"Update\",labels=\"UpdateType\",\n#    dataset_name=\"metaeval/defeasible-nli\",config_name='social')\n\nhelp_nli = Classification(\"ori_sentence\",\"new_sentence\",\"gold_label\",\n    dataset_name=\"tasksource/help-nli\")\n    \nnli_veridicality_transitivity = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name=\"metaeval/nli-veridicality-transitivity\")\n\nlonli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"tasksource/lonli\")\n\ndadc_limit = Classification(\"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/dadc-limit-nli\")\n\nflute = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"ColumbiaNLP/FLUTE\")\n\nstrategy_qa = Classification('question',labels='answer',\n    dataset_name=\"tasksource/strategy-qa\",splits=['train',None,None])\n\nsummarize_from_feedback = MultipleChoice(get.info.post,\n    choices_list=lambda x: [x['summaries'][0]['text'],x['summaries'][1]['text']],\n    labels=\"choice\",\n    dataset_name=\"openai/summarize_from_feedback\", config_name=\"comparisons\",\n    pre_process = lambda ds:ds.filter(lambda x: type(get.info.post(x))==str)\n)\n\nfolio = Classification(\"premises\",\"conclusion\",\n    labels=lambda x:{'False':'contradiction','True':'entailment', 'Uncertain':'neutral'}.get(x[\"label\"]),\n    dataset_name=\"tasksource/folio\")\n\ntomi_nli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name=\"tasksource/tomi-nli\")\n\navicenna = Classification(\"Premise 1\",\"Premise 2\",\"Syllogistic relation\",\n    dataset_name=\"tasksource/avicenna\")\n\nshp = MultipleChoice(\"history\",\n    choices=['human_ref_A','human_ref_B'],\n    labels=\"labels\",\n    dataset_name=\"stanfordnlp/SHP\")\n\nmedqa_usmle = MultipleChoice('sent1',choices=regen('ending[0-3]'),labels='label',\n    dataset_name=\"GBaker/MedQA-USMLE-4-options-hf\")\n\nwikimedqa = MultipleChoice(\"text\",choices=regen('option\\_[0-7]'),labels='label',\n    dataset_name=\"sileod/wikimedqa\",\n    config_name=[\"medwiki\"])\n\ncicero = MultipleChoice(lambda x: \" \".join(x['Dialogue']),\n    choices_list=\"Choices\", labels=lambda x:x['Human Written Answer'][0],\n    dataset_name=\"declare-lab/cicero\")\n\ncreak = Classification(\"sentence\",labels=\"label\",\n    dataset_name='amydeng2000/CREAK')\n\nmutual = MultipleChoice(\"article\",choices_list=\"options\",\n    labels=lambda x: \"ABCD\".index(x['answers']),\n    dataset_name=\"tasksource/mutual\",splits=[\"train\",None,None])\n\nneqa = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/NeQA\")\nquote_repetition = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/quote-repetition\")\nredefine_math = MultipleChoice('prompt',choices_list='classes',labels=\"answer_index\",\n    dataset_name=\"inverse-scaling/redefine-math\")\n\npuzzte = Classification(\"puzzle_text\",\"question\",\"answer\",\n    dataset_name=\"tasksource/puzzte\")\n\nimplicatures = MultipleChoice(cat(['context','response'],\"\\n\"),\n    choices=['correct_implicature','incorrect_implicature'],\n    labels=constant(0),\n    dataset_name='tasksource/implicatures')\n\nrace = MultipleChoice(cat(['question','article'],'\\n'), choices_list='options',\n    labels=lambda x:'ABCDE'.index(x['answer']),\n    config_name=['middle','high'])\n\nrace_c = MultipleChoice(cat(['question','article'],'\\n'),choices_list='option',labels='label',\n    dataset_name='tasksource/race-c')\n\nspartqa_yn=Classification(\"story\",\"question\",\"answer\",\n    dataset_name=\"tasksource/spartqa-yn\")\n\nspartqa_mc=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",labels=\"answer\",\n    dataset_name=\"tasksource/spartqa-mchoice\")\n\ntemporal_nli = Classification(\"Premise\",\"Hypothesis\",\"Label\",\n    dataset_name=\"tasksource/temporal-nli\")\n\nriddle_sense = MultipleChoice(\"question\", choices_list=get.choices.text, \n    labels=lambda x : \"ABCDE\".index(x['answerKey']))\n\nclcd = Classification(\n    \"sentence1\",\"sentence2\",\"label\",\n    dataset_name=\"tasksource/clcd-english\")\n\ntwentyquestions = Classification(\"question\",\"subject\",\"answer\",dataset_name=\"maximedb/twentyquestions\")\n\nreclor = MultipleChoice(cat([\"context\",\"question\"]),choices_list=\"answers\",labels=\"label\",\n    dataset_name=\"metaeval/reclor\",splits=['train','validation',None])\n\nc_aug_imdb = Classification(\"Text\",labels=\"Sentiment\",\n    dataset_name='tasksource/counterfactually-augmented-imdb')\n\nc_aug_snli = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name='tasksource/counterfactually-augmented-snli')\n\ncnli = Classification(\"premise\",\"hypothesis\",\"label\",\n    dataset_name='metaeval/cnli')\n\nperturbed_boolq = Classification(\"question\",labels=\"hard_label\",\n    dataset_name='tasksource/boolq-natural-perturbations')\n\n#mega_acceptability = Classification(\"sentence\",labels=\"average\",\n#    dataset_name='metaeval/mega-acceptability-v2')\n\ngraded_acceptability = Classification(\"text\",labels=\"normalized_score\",\n    dataset_name=\"metaeval/acceptability-prediction\")\n\nequate = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name='metaeval/equate')\n\nscience_qa = MultipleChoice(\"question\",choices_list=\"choices\",labels=\"answer\",\n    dataset_name=\"tasksource/ScienceQA_text_only\")\n\nekar=MultipleChoice(\"question\",choices_list=get.choices.text,\n    labels=lambda x:\"ABCD\".index(x['answerKey']),\ndataset_name=\"Jiangjie/ekar_english\")\n\nimplicit_hate = Classification(\"post\",labels=\"class\",\n    dataset_name=\"tasksource/implicit-hate-stg1\")\n\nnli_unambiguity = Classification(\"premise\",\"hypothesis\",\"gini\",\n    dataset_name=\"metaeval/chaos-mnli-ambiguity\")\n\nheadline_cause = Classification('left_title','right_title','label',\n    dataset_name='IlyaGusev/headline_cause',config_name='en_simple')\n\nlogiqa_2 = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/logiqa-2.0-nli\")\n\n_oasst = dict(dataset_name=\"tasksource/oasst2_dense_flat\",\n    pre_process = lambda ds:ds.filter(lambda x:x['lang']=='en'))\n\noasst1__quality = Classification(\"parent_text\",\"text\",labels=\"quality\",**_oasst)\noasst1__toxicity = Classification(\"parent_text\",\"text\",labels=\"toxicity\",**_oasst)\noasst1__helpfulness = Classification(\"parent_text\",\"text\",labels=\"helpfulness\",**_oasst)\n\nmindgames = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"sileod/mindgames\")\n\ndef _udep_post_process(ds):\n    return ds.cast_column('labels', Sequence(ClassLabel(names=udep_en_labels)))\n\nudep__deprel = TokenClassification('tokens',lambda x:[udep_en_labels.index(a) for a in x['deprel']],\n    config_name=udep_en_configs,dataset_name=\"universal_dependencies\",post_process=_udep_post_process)\n\nambient= Classification(\"premise\",\"hypothesis\",\"hypothesis_ambiguous\",dataset_name=\"metaeval/ambient\")\n\npath_naturalness = MultipleChoice(constant(\"\"),choices=['choice1','choice2'],labels=\"label\",\n    dataset_name=\"metaeval/path-naturalness-prediction\")\n\ncivil_comments__toxicity = Classification(\"text\",labels=\"toxicity\")\ncivil_comments__severe_toxicity = Classification(\"text\",labels=\"severe_toxicity\")\ncivil_comments__obscene = Classification(\"text\",labels=\"obscene\")\ncivil_comments__threat = Classification(\"text\",labels=\"threat\")\ncivil_comments__insult = Classification(\"text\",labels=\"insult\")\ncivil_comments__identity_attack = Classification(\"text\",labels=\"identity_attack\")\ncivil_comments__sexual_explicit = Classification(\"text\",labels=\"sexual_explicit\")\n\ncloth = MultipleChoice(\"sentence\", choices_list=lambda x:[x[\"answer\"]]+x[\"distractors\"],labels=constant(0), dataset_name=\"AndyChiang/cloth\")\ndgen  = MultipleChoice(\"sentence\", choices_list=lambda x:[x[\"answer\"]]+x[\"distractors\"],labels=constant(0), dataset_name=\"AndyChiang/dgen\")\n\ni2d2 = Classification(\"sentence1\",labels=name('label',['False','True']), dataset_name=\"tasksource/I2D2\")\n\narg_me = Classification('argument','conclusion','stance', dataset_name=\"webis/args_me\")\nvalueeval_stance = Classification(\"Premise\",\"Conclusion\",\"Stance\", dataset_name=\"webis/Touche23-ValueEval\")\nstarcon = Classification('argument','topic','label',dataset_name=\"tasksource/starcon\")\n\nbanking77 = Classification(\"text\",labels=\"label\",dataset_name=\"PolyAI/banking77\")\n    \ncontrol = Classification('premise','hypothesis',\"label\",dataset_name=\"tasksource/ConTRoL-nli\")\ntracie = Classification(\"premise\",\"hypothesis\",\"answer\",dataset_name='tasksource/tracie')\nsherliic = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='tasksource/sherliic')\n\nsen_making__1 = MultipleChoice(constant('Chose most plausible:'), choices=['sentence0','sentence1'],labels='false', \n    dataset_name=\"tasksource/sen-making\")\n\nsen_making__2 = MultipleChoice(lambda x: [x['sentence0'],x['sentence1']][x['false']] + '\\n is not plausible because :',\n    choices=['A','B','C'],labels=lambda x: 'ABC'.index(x['reason']), dataset_name=\"tasksource/sen-making\")\n\nwinowhy = Classification('sentence', lambda x: f'In \"{x[\"wnli_sent1\"]}\", {x[\"wnli_sent2\"]}',\n    labels=name('label',['False','True']), dataset_name=\"tasksource/winowhy\")\n\n#for CFG in \"cognitive-bias\", \"fake-news\", \"gender-bias\", \"hate-speech\", \"linguistic-bias\", \"political-bias\", \"racial-bias\", \"text-level-bias\":\n#    print(f\"mbib__{CFG.replace('-','_')} = Classification('text',labels=name('label',['not {CFG}','{CFG}']), dataset_name='mediabiasgroup/mbib-base', config_name='{CFG}')\")\n\n\"\"\"\nmbib_cognitive_bias\t= Classification('text',labels=name('label',['not cognitive-bias','cognitive-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='cognitive-bias')\nmbib_fake_news\t= Classification('text',labels=name('label',['not fake-news','fake-news']), dataset_name='mediabiasgroup/mbib-base', config_name='fake-news')\nmbib_gender_bias\t= Classification('text',labels=name('label',['not gender-bias','gender-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='gender-bias')\nmbib_hate_speech\t= Classification('text',labels=name('label',['not hate-speech','hate-speech']), dataset_name='mediabiasgroup/mbib-base', config_name='hate-speech')\nmbib_linguistic_bias\t= Classification('text',labels=name('label',['not linguistic-bias','linguistic-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='linguistic-bias')\nmbib_political_bias\t= Classification('text',labels=name('label',['not political-bias','political-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='political-bias')\nmbib_racial_bias\t= Classification('text',labels=name('label',['not racial-bias','racial-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='racial-bias')\nmbib_text_level_bias\t= Classification('text',labels=name('label',['not text-level-bias','text-level-bias']), dataset_name='mediabiasgroup/mbib-base', config_name='text-level-bias')\n\"\"\"\n\nrobustLR = Classification(\"context\",\"statement\",\"label\", dataset_name=\"tasksource/robustLR\")\n\ncluttr = Classification(\"story\",\"query\", \"target_text\",dataset_name=\"CLUTRR/v1\", config_name=\"gen_train234_test2to10\")\n\nlogical_fallacy = Classification(\"source_article\", labels=\"logical_fallacies\", dataset_name=\"tasksource/logical-fallacy\")\n\nparade = Classification(\"Definition1\",\"Definition2\", labels=name('Binary labels',[\"not-paraphrase\",\"paraphrase\"]), dataset_name=\"tasksource/parade\")\n\ncladder = Classification(\"given_info\", \"question\", \"answer\",dataset_name=\"tasksource/cladder\")\n\nsubjectivity = Classification(\"Sentence\",labels=\"Label\",dataset_name=\"tasksource/subjectivity\")\n\nmoh   = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/MOH\")\nvuac  = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/VUAC\")\ntrofi = Classification(\"context\",\"expression\",\"label\", dataset_name=\"tasksource/TroFi\", splits=['train',None,'test'])\n\nsharc_classification = Classification(\"snippet\", lambda x:f'{x[\"scenario\"]}\\n{x[\"question\"]}',\n    labels=lambda x:x[\"answer\"] if x['answer'] in  {\"Yes\",\"No\",\"Irrelevant\"} else \"Clarification needed\",\n    dataset_name='sharc_modified',config_name='mod')\n\nconceptrules_v2 = Classification(\"context\", \"text\", \"label\", dataset_name=\"tasksource/conceptrules_v2\")\n\nscidtb = Classification(\"unit1_txt\",\"unit2_txt\",\"label\", dataset_name=\"metaeval/disrpt\",config_name='eng.dep.scidtb.rels')\n\nchunking = TokenClassification(\"tokens\",\"chunk_tags\", dataset_name=\"conll2000\")\n\nfew_nerd = TokenClassification(\"tokens\",\"fine_ner_tags\",dataset_name=\"DFKI-SLT/few-nerd\",config_name='supervised')\nfiner = TokenClassification('tokens','ner_tags',dataset_name='nlpaueb/finer-139')\n\nlabel_nli = Classification(\"premise\",\"hypothesis\",\"labels\",dataset_name='tasksource/zero-shot-label-nli')\n\ncom2sense = Classification(\"sent\",labels=\"label\",dataset_name=\"tasksource/com2sense\",splits=['train',\"validation\",None])\n\nscone = Classification('sentence1_edited','sentence2_edited','gold_label_edited',dataset_name=\"tasksource/scone\")\n\nwinodict = MultipleChoice(cat(['definition','sentence']),['option1','option2'],'label',dataset_name='tasksource/winodict')\n\nfool_me_twice = Classification(\n    lambda x: \" \".join(a['text'] for a in x['gold_evidence']),\n    'text', 'label', dataset_name='tasksource/fool-me-twice')\n\nmonli = Classification(\"sentence1\",\"sentence2\",\"gold_label\", dataset_name=\"tasksource/monli\")\n\ncausality = Classification('premise','hypothesis','relation', dataset_name='tasksource/corr2cause')\n\nlsat = MultipleChoice(cat(['passage','question']), choices_list='references',labels='gold_index',dataset_name='lighteval/lsat_qa',config_name='all')\n\napt = Classification('text_a','text_b',name('labels',['not_paraphrase','paraphrase']),dataset_name='tasksource/apt')\n\n#xsum_factuality = Classification(\"summary\",labels=\"is_factual\")\n\nfinancial_sentiment = Classification(\"text\",labels=name('label',['Bearish','Bullish','Neutral']),\n    dataset_name=\"zeroshot/twitter-financial-news-sentiment\")\n\ndef _icl_rand(x):\n    import random\n    return random.Random(x['sentence1'][:50]).randint(0,1) #deterministic label for each input\n\nicl = Classification(\"inputs\", lambda x: x['symbols'][_icl_rand(x)],\n    labels=lambda x: str(x['symbols'][_icl_rand(x)]==x['targets']),\n    dataset_name=\"tasksource/icl-symbol-tuning-instruct\",\n    pre_process=lambda ds:ds.filter(lambda x:len(x['inputs'])<500*4), # 500 tokens of 4 char \n)\n\nspace_nli = Classification(\"premises\",\"hypothesis\",\"label\",dataset_name=\"tasksource/SpaceNLI\")\n\npropsegment = Classification(\"hypothesis\",\"premise\",\n    labels = lambda x:{'n':'neutral','e':'entailment','c':'contradiction'}[x['label']],\n    dataset_name=\"sihaochen/propsegment\",config_name='nli')\n\nhatemoji = Classification('text',labels=name(\"label_gold\", ['not-hate-speech','hate-speech']),\n    dataset_name=\"HannahRoseKirk/HatemojiBuild\")\n\nregset = Classification(\"context\",labels=\"answer\",dataset_name='tasksource/regset')\n\nesci = Classification('query','product_text','esci_label',\n    dataset_name=\"tasksource/esci\",\n    pre_process=lambda ds:ds.filter(lambda x:x['product_locale']=='us'))\n\ndef _preprocess_chatbot_arena(ds):\n    ds=ds.filter(lambda x:x['winner'] in [\"model_a\",\"model_b\"])\n    ds=ds.filter(lambda x:x['language']==\"English\")\n\n    def _unroll(x):\n        f=lambda x:\"\\n\".join([f\"{turn['role']}:\\n{turn['content']}\" for turn in x])\n        x['conversation_a'] = f(x['conversation_a'])\n        x['conversation_b'] = f(x['conversation_b'])\n        return x\n    ds=ds.map(_unroll)\n    return ds\n\nchatbot_arena = MultipleChoice(constant(\"\"),\n    choices=[\"conversation_a\",\"conversation_b\"],\n    labels=lambda x: [\"model_a\",\"model_b\"].index(x[\"winner\"]),\n    dataset_name=\"lmsys/chatbot_arena_conversations\",\n    pre_process=_preprocess_chatbot_arena)\n\ndnd_intent = Classification(\"examples\",labels=\"label_names\",\n    dataset_name='neurae/dnd_style_intents')\n\nfld = Classification(\"context\",\"hypothesis\", \"proof_label\",\n    dataset_name=\"hitachi-nlp/FLD.v2\",config_name=\"default\")\n\nflds = Classification(\"context\",\"hypothesis\", \"proof_label\",\n    dataset_name=\"hitachi-nlp/FLD.v2\",config_name=\"star\")\n\nsdoh_nli = Classification(\"premise\",\"hypothesis\",labels=lambda x:{True:\"entailment\",False:\"not_entailment\"}[x['label']],\n    dataset_name=\"tasksource/SDOH-NLI\")\n\nscifact_entailment = Classification(lambda x:\"\\n\".join(x[\"abstract\"]),\"claim\",\n    labels=lambda x:x['verdict'].replace('NEI','NEUTRAL').lower(),\n    dataset_name=\"allenai/scifact_entailment\")\n\nfeasibilityQA = Classification(cat(['knowledge','premise']),'hypothesis','binary_classification_label',\n    dataset_name=\"tasksource/feasibilityQA\")\n                               \nsimple_pair = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"tasksource/simple_pair\")\nadjective_scale_probe = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"tasksource/AdjectiveScaleProbe-nli\")\nrepectively_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/resnli\")\n\nspartun=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",\n    labels=lambda x: [c.lower() for c in x['choices_list']].index(x[\"answer\"][0].lower()),\n    pre_process=lambda ds:ds.filter(lambda x:len(x['answer'])==1),\n    dataset_name=\"tasksource/SpaRTUN\")\n\nresq=MultipleChoice(cat([\"story\",\"question\"]),choices_list=\"candidate_answers\",\n    labels=lambda x: [c.lower() for c in x['choices_list']].index(x[\"answer\"][0].lower()),\n    pre_process=lambda ds:ds.filter(lambda x:len(x['answer'])==1),\n    dataset_name=\"tasksource/ReSQ\")\n\nsemantic_fragments_nli = Classification(\"sentence1\",\"sentence2\",\"gold_label\",\n    dataset_name=\"tasksource/semantic_fragments_nli\")\n\nmoritz_zs_nli = Classification('text','hypothesis','labels',\n    pre_process=lambda ds:ds.filter(lambda x:x['task_name'] not in  [\"mnli\", \"anli\", \"fevernli\", \"wanli\", \"lingnli\"]),\n    dataset_name=\"MoritzLaurer/dataset_train_nli\"\n) \n\nstepgame = Classification('story','question','label',dataset_name=\"tasksource/stepgame\")\n\ndef _nlgraph_binarize(x):\n    a=x['answer'].lower()\n    if \"yes\" in a: return \"True\"\n    if \"no\" in a: return \"False\"\n    assert False\n\nnlgraph = Classification('question',labels=_nlgraph_binarize,\n    pre_process=lambda ds:ds.filter(lambda x:x['task'] in \"connectivity cycle hamilton\"),\n    dataset_name=\"tasksource/nlgraph\")\n\noasst_rlhf = MultipleChoice(\"prompt\",choices=['chosen','rejected'],labels=constant(0),\n    dataset_name=\"tasksource/oasst2_pairwise_rlhf_reward\")\n\nanthropic_rlhf_helpfulness = MultipleChoice(constant('Most helpful assistant answer:'), ['chosen','rejected'], constant(0),\n    dataset_name=\"tasksource/hh-rlhf\",config_name=[\"helpful-base\", \"helpful-online\", \"helpful-rejection-sampled\"])\n\nanthropic_rlhf_harmless = MultipleChoice(constant('Most harmless assistant answer:'), ['chosen','rejected'], constant(0),\n    dataset_name=\"tasksource/hh-rlhf\",config_name=\"harmless-base\")\n\nruletaker = Classification(\n    lambda x: 'What is not explicitly stated as true is considered false. \\n' +x[\"context\"], #closed world assumption\n    \"question\",\"label\",dataset_name=\"tasksource/ruletaker\")\n\npara_rules = Classification(\n    lambda x: 'What is not explicitly stated as true is considered false. \\n' +x[\"context\"], #closed world assumption\n    \"question\", labels=name(\"label\",[\"False\",\"True\"]),\n    dataset_name=\"qbao775/PARARULE-Plus\")\n\nproofwriter_deduction = Classification(\"theory\",\"question\",\"answer\",\n    dataset_name=\"tasksource/proofwriter\") #open world assumption\n\nlogical_entailment = Classification(\"A\",\"B\",\"label\",dataset_name='tasksource/logical-entailment')\n\nnope = Classification('premise','hypothesis',\n    labels=lambda x:dict(E='entailment',N='neutral',C='contradiction').get(x['label'],x['label']),\n    dataset_name='tasksource/nope')\n\nlogicNLI = Classification('premise','hypothesis','label',dataset_name='tasksource/LogicNLI')\n\ncontract_nli__seg = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"kiddothe2b/contract-nli\",config_name=\"contractnli_a\")\n\ncontract_nli__full = Classification(\"premise\",\"hypothesis\",\"label\", dataset_name=\"kiddothe2b/contract-nli\",config_name=\"contractnli_b\")\n\nnli4ct = Classification(lambda x: \"\\n\".join(x['Primary_evidence']),'Statement',\"Label\",\n    dataset_name=\"AshtonIsNotHere/nli4ct_semeval2024\",splits=['train','dev',None])\n\nlsat_ar = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',labels=\"label\",\n     dataset_name=\"tasksource/lsat-ar\")\n    \nlsat_rc = MultipleChoice(\n    cat(['context','question']),\n    choices_list='answers',labels=\"label\",\n     dataset_name=\"tasksource/lsat-rc\")\n    \nbiosift_nli = Classification(\"Abstract\",\"Hypothesis\",\n    labels=lambda x: {True:\"entailment\",False:\"not-entailment\"}[bool(x['Entailment'])],\n    dataset_name=\"AshtonIsNotHere/biosift-nli\")\n\nbrainteasers = MultipleChoice(\"question\",\n    choices_list=lambda x:eval(x[\"choice_list\"]),\n    labels=\"label\",\n    dataset_name=\"tasksource/brainteasers\",config_name=['WP','SP'])\n\n#GATED !\n#toxigen = Classification(\"text\",labels=\"toxicity_human\", dataset_name=\"skg/toxigen-data\")\n\npersuasiveness = Classification(\"claim\",\"argument\",labels=\"persuasiveness_metric\",dataset_name=\"Anthropic/persuasion\")\n\n#ste_wic = Classification(cat(\"text_1\",\"text_2\"),\n#    lambda x:f\"{x['target']} means the same thing in these texts\",\n#    \"gold_label_binary\",\n#    dataset_name=\"cardiffnlp/super_tweeteval\", config_name=\"tempo_wic\",splits=['train','validation',None])\n\n#ste_nerd = Classification(\"text\",\n#    lambda x:f\"definition of {x['target']} here is 'x{['definition']}'\",\n#    \"gold_label_binary\",\n#    dataset_name=\"cardiffnlp/super_tweeteval\", config_name=\"tweet_nerd\",splits=['train','validation',None])\n \n#ste_sim = Classification(\"text_1\",\"text_2\",lambda x:x['gold_score']/5,\n#    dataset_name=\"cardiffnlp/super_tweeteval\",config_name=\"tweet_similarity\",splits=['train','validation',None])\n\n#ste_intimacy = Classification(\"text_1\",labels=lambda x:x['gold_score']/5,\n#    dataset_name=\"cardiffnlp/super_tweeteval\",config_name=\"tweet_intimacy\")\n\n#ccdv/patent-classification|abstract text label\n\nambigNQ = Classification(\"question\",labels=lambda x:{True:\"ambiguous\", False:\"not ambiguous\"}.get(x[\"ambig\"]),\n    dataset_name=\"erbacher/AmbigNQ-clarifying-question\")\n\nsiga_nli = Classification(\"premise\",\"statement\",\"label\",dataset_name=\"tasksource/SIGA-nli\")\n\nunigram_fol = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='unigram/FOL-nli')\n\n#gs_goal = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n#        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"goal\")\n\n#gs_step = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n#        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"step\")\n\ngs_order = MultipleChoice(\"sent2\",regen(\"ending[0-1]\"),\"label\",\n        dataset_name=\"tasksource/goal-step-wikihow\",config_name=\"order\")\n\nparadise = MultipleChoice(\"sent2\",regen(\"ending[0-3]\"),\"label\",\n      dataset_name=\"GGLab/PARADISE\")\n\ndocnli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/doc-nli\")\n\nmctest_nli = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name=\"tasksource/mctest-nli\")\n\npatent_phrase_similarity = Classification(\"anchor\",\"target\",\"label\",dataset_name=\"tasksource/patent-phrase-similarity\")\n\nnlsat = Classification('sentence',labels='label',dataset_name=\"tasksource/natural-language-satisfiability\")\n\nidioms_nli = Classification('premise','hypothesis','label',dataset_name=\"tasksource/idioms-nli\")\n\nlifeycle_entailment = Classification(\"premise\",\"hypothesis\",\"label\",dataset_name='tasksource/lifecycle-entailment')\n\n\nhelpsteer__helpfulness = Classification(\"prompt\", \"response\", \"helpfulness\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__correctness = Classification(\"prompt\", \"response\", \"correctness\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__coherence = Classification(\"prompt\", \"response\", \"coherence\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__complexity = Classification(\"prompt\", \"response\", \"complexity\", dataset_name=\"nvidia/HelpSteer\")\nhelpsteer__verbosity = Classification(\"prompt\", \"response\", \"verbosity\", dataset_name=\"nvidia/HelpSteer\")\n\nhelpsteer_2__helpfulness = Classification(\"prompt\",\"response\",\"helpfulness\",dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__correctness = Classification(\"prompt\", \"response\", \"correctness\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__coherence = Classification(\"prompt\", \"response\", \"coherence\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__complexity = Classification(\"prompt\", \"response\", \"complexity\", dataset_name=\"nvidia/HelpSteer2\")\nhelpsteer_2__verbosity = Classification(\"prompt\", \"response\", \"verbosity\", dataset_name=\"nvidia/HelpSteer2\")\n\nmsci_nli = Classification('sentence1','sentence2','label',dataset_name='sadat2307/MSciNLI')\n\n#lex_glue___ecthr_a = Classification(sentence1=\"text\", labels=\"labels\",dataset_name=\"coastalcph/lex_glue\",config_name=\"ecthr_a\") # too long\n#lex_glue___ecthr_b = Classification(sentence1=\"text\", labels=\"labels\") # too long\n\nultrafeedback = MultipleChoice(\"question\", choices=['response_j','response_k'],labels=constant(0), dataset_name=\"pushpdeep/UltraFeedback-paired\")\n\nessay_scoring = Classification(\"full_text\",labels=\"score\",dataset_name='tasksource/AES2-essay-scoring')\n\n#argument_feedback = Classification(\"discourse_text\",labels=\"discourse_effectiveness\", dataset_name=\"tasksource/argument-feedback\")\n\neg = lambda x: Classification(\"full_text\", labels=lambda y:int(y[x]), dataset_name=\"tasksource/english-grading\")\ngrading__cohesion = eg('cohesion')\ngrading__syntax = eg('syntax')\ngrading__vocabulary = eg('vocabulary')\ngrading__phraseology = eg('phraseology')\ngrading__grammar = eg('grammar')\ngrading__conventions = eg('conventions')\n\nwice = Classification(lambda x: \"\\n\".join(x['evidence']),'claim','label',\n    dataset_name='tasksource/wice')\n\nhover = Classification(\"evidence\",\"claim\",\"label\",\n    dataset_name=\"Dzeniks/hover\") \n\nhover__nli = Classification(\"evidence\",\"claim\",name(\"label\",[\"entailment\",\"neutral\",\"contradiction\"]),\n    dataset_name=\"Dzeniks/hover-3way\")\n\ntasksource_dpo = MultipleChoice(\"prompt\",choices=['chosen','rejected'],labels=constant(0),\n    dataset_name=\"tasksource/tasksource_dpo_pairs\")\n\nseahorse = Classification('article',cat([\"summary\", \"question\"]),'answer',\n    dataset_name=\"tasksource/seahorse_summarization_evaluation\")\n\nmip = Classification(\"prompt\",labels=\"y\",\n    dataset_name=\"sileod/missing-item-prediction\",config_name=\"contrastive\")\n\njigsaw_toxicity = Classification('comment_text',labels=name(\"toxic\",[\"notthate\",\"hate\"]),\n    dataset_name=\"tasksource/jigsaw_toxicity\")\n\npol_nli = Classification(\"premise\",\"hypothesis\",labels=name('entailment',['entailment','not_entailment']),\n    dataset_name=\"mlburnham/Pol_NLI\")\n\nsynthetic_retrieval_nli = Classification('premise','hypothesis','label',dataset_name='tasksource/synthetic-retrieval-NLI',\n    config_name=[\"binary\",\"count\",\"position\"],\n    pre_process=lambda ds:ds.filter(lambda x:x['n']<=2048))\n\nissue_similarity = Classification(\"text1\",\"text2\",\"label\",\n    dataset_name=\"WhereIsAI/github-issue-similarity\")\n\n#nli_l2 = Classification(\"sentence1\",\"sentence2\",\"labels\",\n#    dataset_name=\"tasksource/merged-2l-nli\")\n\n#nli_l3 =  Classification(\"sentence1\",\"sentence2\",\"labels\",\n#    dataset_name=\"tasksource/merged-3l-nli\")\n"
  },
  {
    "path": "tasks.md",
    "content": "|     | id                                                                   | dataset_name                                 | config_name                                         | task_name       | preprocessing_name                           | task_type           |\n|----:|:---------------------------------------------------------------------|:---------------------------------------------|:----------------------------------------------------|:----------------|:---------------------------------------------|:--------------------|\n|   0 | glue/mnli                                                            | glue                                         | mnli                                                |                 | glue___mnli                                  | Classification      |\n|   1 | glue/qnli                                                            | glue                                         | qnli                                                |                 | glue___qnli                                  | Classification      |\n|   2 | glue/rte                                                             | glue                                         | rte                                                 |                 | glue___rte                                   | Classification      |\n|   3 | glue/wnli                                                            | glue                                         | wnli                                                |                 | glue___wnli                                  | Classification      |\n|   4 | glue/mrpc                                                            | glue                                         | mrpc                                                |                 | glue___mrpc                                  | Classification      |\n|   5 | glue/qqp                                                             | glue                                         | qqp                                                 |                 | glue___qqp                                   | Classification      |\n|   6 | glue/stsb                                                            | glue                                         | stsb                                                |                 | glue___stsb                                  | Classification      |\n|   7 | super_glue/boolq                                                     | super_glue                                   | boolq                                               |                 | super_glue___boolq                           | Classification      |\n|   8 | super_glue/cb                                                        | super_glue                                   | cb                                                  |                 | super_glue___cb                              | Classification      |\n|   9 | super_glue/multirc                                                   | super_glue                                   | multirc                                             |                 | super_glue___multirc                         | Classification      |\n|  10 | super_glue/wic                                                       | super_glue                                   | wic                                                 |                 | super_glue___wic                             | Classification      |\n|  11 | super_glue/axg                                                       | super_glue                                   | axg                                                 |                 | super_glue___axg                             | Classification      |\n|  12 | anli/a1                                                              | anli                                         |                                                     | a1              | anli__a1                                     | Classification      |\n|  13 | anli/a2                                                              | anli                                         |                                                     | a2              | anli__a2                                     | Classification      |\n|  14 | anli/a3                                                              | anli                                         |                                                     | a3              | anli__a3                                     | Classification      |\n|  15 | babi_nli/basic-coreference                                           | tasksource/babi_nli                          | basic-coreference                                   |                 | babi_nli                                     | Classification      |\n|  16 | babi_nli/time-reasoning                                              | tasksource/babi_nli                          | time-reasoning                                      |                 | babi_nli                                     | Classification      |\n|  17 | babi_nli/conjunction                                                 | tasksource/babi_nli                          | conjunction                                         |                 | babi_nli                                     | Classification      |\n|  18 | babi_nli/lists-sets                                                  | tasksource/babi_nli                          | lists-sets                                          |                 | babi_nli                                     | Classification      |\n|  19 | babi_nli/positional-reasoning                                        | tasksource/babi_nli                          | positional-reasoning                                |                 | babi_nli                                     | Classification      |\n|  20 | babi_nli/yes-no-questions                                            | tasksource/babi_nli                          | yes-no-questions                                    |                 | babi_nli                                     | Classification      |\n|  21 | babi_nli/simple-negation                                             | tasksource/babi_nli                          | simple-negation                                     |                 | babi_nli                                     | Classification      |\n|  22 | babi_nli/three-arg-relations                                         | tasksource/babi_nli                          | three-arg-relations                                 |                 | babi_nli                                     | Classification      |\n|  23 | babi_nli/two-supporting-facts                                        | tasksource/babi_nli                          | two-supporting-facts                                |                 | babi_nli                                     | Classification      |\n|  24 | babi_nli/path-finding                                                | tasksource/babi_nli                          | path-finding                                        |                 | babi_nli                                     | Classification      |\n|  25 | babi_nli/two-arg-relations                                           | tasksource/babi_nli                          | two-arg-relations                                   |                 | babi_nli                                     | Classification      |\n|  26 | babi_nli/basic-deduction                                             | tasksource/babi_nli                          | basic-deduction                                     |                 | babi_nli                                     | Classification      |\n|  27 | babi_nli/basic-induction                                             | tasksource/babi_nli                          | basic-induction                                     |                 | babi_nli                                     | Classification      |\n|  28 | babi_nli/single-supporting-fact                                      | tasksource/babi_nli                          | single-supporting-fact                              |                 | babi_nli                                     | Classification      |\n|  29 | babi_nli/three-supporting-facts                                      | tasksource/babi_nli                          | three-supporting-facts                              |                 | babi_nli                                     | Classification      |\n|  30 | babi_nli/compound-coreference                                        | tasksource/babi_nli                          | compound-coreference                                |                 | babi_nli                                     | Classification      |\n|  31 | babi_nli/counting                                                    | tasksource/babi_nli                          | counting                                            |                 | babi_nli                                     | Classification      |\n|  32 | babi_nli/size-reasoning                                              | tasksource/babi_nli                          | size-reasoning                                      |                 | babi_nli                                     | Classification      |\n|  33 | babi_nli/indefinite-knowledge                                        | tasksource/babi_nli                          | indefinite-knowledge                                |                 | babi_nli                                     | Classification      |\n|  34 | sick/label                                                           | sick                                         |                                                     | label           | sick__label                                  | Classification      |\n|  35 | sick/relatedness                                                     | sick                                         |                                                     | relatedness     | sick__relatedness                            | Classification      |\n|  36 | sick/entailment_AB                                                   | sick                                         |                                                     | entailment_AB   | sick__entailment_AB                          | Classification      |\n|  37 | snli                                                                 | snli                                         |                                                     |                 | snli                                         | Classification      |\n|  38 | scitail/snli_format                                                  | scitail                                      | snli_format                                         |                 | scitail                                      | Classification      |\n|  39 | hans                                                                 | hans                                         |                                                     |                 | hans                                         | Classification      |\n|  40 | WANLI                                                                | alisawuffles/WANLI                           |                                                     |                 | wanli                                        | Classification      |\n|  41 | recast/recast_puns                                                   | tasksource/recast                            | recast_puns                                         |                 | recast_nli                                   | Classification      |\n|  42 | recast/recast_verbcorner                                             | tasksource/recast                            | recast_verbcorner                                   |                 | recast_nli                                   | Classification      |\n|  43 | recast/recast_verbnet                                                | tasksource/recast                            | recast_verbnet                                      |                 | recast_nli                                   | Classification      |\n|  44 | recast/recast_factuality                                             | tasksource/recast                            | recast_factuality                                   |                 | recast_nli                                   | Classification      |\n|  45 | recast/recast_ner                                                    | tasksource/recast                            | recast_ner                                          |                 | recast_nli                                   | Classification      |\n|  46 | recast/recast_megaveridicality                                       | tasksource/recast                            | recast_megaveridicality                             |                 | recast_nli                                   | Classification      |\n|  47 | recast/recast_sentiment                                              | tasksource/recast                            | recast_sentiment                                    |                 | recast_nli                                   | Classification      |\n|  48 | recast/recast_kg_relations                                           | tasksource/recast                            | recast_kg_relations                                 |                 | recast_nli                                   | Classification      |\n|  49 | probability_words_nli/reasoning_1hop                                 | sileod/probability_words_nli                 | reasoning_1hop                                      |                 | probability_words_nli                        | Classification      |\n|  50 | probability_words_nli/reasoning_2hop                                 | sileod/probability_words_nli                 | reasoning_2hop                                      |                 | probability_words_nli                        | Classification      |\n|  51 | probability_words_nli/usnli                                          | sileod/probability_words_nli                 | usnli                                               |                 | probability_words_nli                        | Classification      |\n|  52 | nan-nli                                                              | joey234/nan-nli                              |                                                     |                 | nan_nli                                      | Classification      |\n|  53 | nli_fever                                                            | pietrolesci/nli_fever                        |                                                     |                 | nli_fever                                    | Classification      |\n|  54 | breaking_nli                                                         | pietrolesci/breaking_nli                     |                                                     |                 | breaking_nli                                 | Classification      |\n|  55 | conj_nli                                                             | pietrolesci/conj_nli                         |                                                     |                 | conj_nli                                     | Classification      |\n|  56 | fracas                                                               | pietrolesci/fracas                           |                                                     |                 | fracas                                       | Classification      |\n|  57 | dialogue_nli                                                         | pietrolesci/dialogue_nli                     |                                                     |                 | dialogue_nli                                 | Classification      |\n|  58 | mpe                                                                  | pietrolesci/mpe                              |                                                     |                 | mpe_nli                                      | Classification      |\n|  59 | dnc                                                                  | pietrolesci/dnc                              |                                                     |                 | dnc_nli                                      | Classification      |\n|  60 | recast_white/fnplus                                                  | pietrolesci/recast_white                     |                                                     | fnplus          | recast_white__fnplus                         | Classification      |\n|  61 | recast_white/sprl                                                    | pietrolesci/recast_white                     |                                                     | sprl            | recast_white__sprl                           | Classification      |\n|  62 | recast_white/dpr                                                     | pietrolesci/recast_white                     |                                                     | dpr             | recast_white__dpr                            | Classification      |\n|  63 | joci                                                                 | pietrolesci/joci                             |                                                     |                 | joci                                         | Classification      |\n|  64 | robust_nli/IS_CS                                                     | pietrolesci/robust_nli                       |                                                     | IS_CS           | robust_nli__IS_CS                            | Classification      |\n|  65 | robust_nli/LI_LI                                                     | pietrolesci/robust_nli                       |                                                     | LI_LI           | robust_nli__LI_LI                            | Classification      |\n|  66 | robust_nli/ST_WO                                                     | pietrolesci/robust_nli                       |                                                     | ST_WO           | robust_nli__ST_WO                            | Classification      |\n|  67 | robust_nli/PI_SP                                                     | pietrolesci/robust_nli                       |                                                     | PI_SP           | robust_nli__PI_SP                            | Classification      |\n|  68 | robust_nli/PI_CD                                                     | pietrolesci/robust_nli                       |                                                     | PI_CD           | robust_nli__PI_CD                            | Classification      |\n|  69 | robust_nli/ST_SE                                                     | pietrolesci/robust_nli                       |                                                     | ST_SE           | robust_nli__ST_SE                            | Classification      |\n|  70 | robust_nli/ST_NE                                                     | pietrolesci/robust_nli                       |                                                     | ST_NE           | robust_nli__ST_NE                            | Classification      |\n|  71 | robust_nli/ST_LM                                                     | pietrolesci/robust_nli                       |                                                     | ST_LM           | robust_nli__ST_LM                            | Classification      |\n|  72 | robust_nli_is_sd                                                     | pietrolesci/robust_nli_is_sd                 |                                                     |                 | robust_nli_is_sd                             | Classification      |\n|  73 | robust_nli_li_ts                                                     | pietrolesci/robust_nli_li_ts                 |                                                     |                 | robust_nli_li_ts                             | Classification      |\n|  74 | gen_debiased_nli/snli_seq_z                                          | pietrolesci/gen_debiased_nli                 |                                                     | snli_seq_z      | gen_debiased_nli__snli_seq_z                 | Classification      |\n|  75 | gen_debiased_nli/snli_z_aug                                          | pietrolesci/gen_debiased_nli                 |                                                     | snli_z_aug      | gen_debiased_nli__snli_z_aug                 | Classification      |\n|  76 | gen_debiased_nli/snli_par_z                                          | pietrolesci/gen_debiased_nli                 |                                                     | snli_par_z      | gen_debiased_nli__snli_par_z                 | Classification      |\n|  77 | gen_debiased_nli/mnli_par_z                                          | pietrolesci/gen_debiased_nli                 |                                                     | mnli_par_z      | gen_debiased_nli__mnli_par_z                 | Classification      |\n|  78 | gen_debiased_nli/mnli_z_aug                                          | pietrolesci/gen_debiased_nli                 |                                                     | mnli_z_aug      | gen_debiased_nli__mnli_z_aug                 | Classification      |\n|  79 | gen_debiased_nli/mnli_seq_z                                          | pietrolesci/gen_debiased_nli                 |                                                     | mnli_seq_z      | gen_debiased_nli__mnli_seq_z                 | Classification      |\n|  80 | add_one_rte                                                          | pietrolesci/add_one_rte                      |                                                     |                 | add_one_rte                                  | Classification      |\n|  81 | imppres/presupposition_possessed_definites_existence/presupposition  | tasksource/imppres                           | presupposition_possessed_definites_existence        | presupposition  | imppres__presupposition                      | Classification      |\n|  82 | imppres/presupposition_only_presupposition/presupposition            | tasksource/imppres                           | presupposition_only_presupposition                  | presupposition  | imppres__presupposition                      | Classification      |\n|  83 | imppres/presupposition_cleft_uniqueness/presupposition               | tasksource/imppres                           | presupposition_cleft_uniqueness                     | presupposition  | imppres__presupposition                      | Classification      |\n|  84 | imppres/presupposition_change_of_state/presupposition                | tasksource/imppres                           | presupposition_change_of_state                      | presupposition  | imppres__presupposition                      | Classification      |\n|  85 | imppres/presupposition_cleft_existence/presupposition                | tasksource/imppres                           | presupposition_cleft_existence                      | presupposition  | imppres__presupposition                      | Classification      |\n|  86 | imppres/presupposition_possessed_definites_uniqueness/presupposition | tasksource/imppres                           | presupposition_possessed_definites_uniqueness       | presupposition  | imppres__presupposition                      | Classification      |\n|  87 | imppres/presupposition_question_presupposition/presupposition        | tasksource/imppres                           | presupposition_question_presupposition              | presupposition  | imppres__presupposition                      | Classification      |\n|  88 | imppres/presupposition_both_presupposition/presupposition            | tasksource/imppres                           | presupposition_both_presupposition                  | presupposition  | imppres__presupposition                      | Classification      |\n|  89 | imppres/presupposition_all_n_presupposition/presupposition           | tasksource/imppres                           | presupposition_all_n_presupposition                 | presupposition  | imppres__presupposition                      | Classification      |\n|  90 | imppres/implicature_gradable_verb/prag                               | tasksource/imppres                           | implicature_gradable_verb                           | prag            | imppres__prag                                | Classification      |\n|  91 | imppres/implicature_numerals_10_100/prag                             | tasksource/imppres                           | implicature_numerals_10_100                         | prag            | imppres__prag                                | Classification      |\n|  92 | imppres/implicature_numerals_2_3/prag                                | tasksource/imppres                           | implicature_numerals_2_3                            | prag            | imppres__prag                                | Classification      |\n|  93 | imppres/implicature_modals/prag                                      | tasksource/imppres                           | implicature_modals                                  | prag            | imppres__prag                                | Classification      |\n|  94 | imppres/implicature_connectives/prag                                 | tasksource/imppres                           | implicature_connectives                             | prag            | imppres__prag                                | Classification      |\n|  95 | imppres/implicature_quantifiers/prag                                 | tasksource/imppres                           | implicature_quantifiers                             | prag            | imppres__prag                                | Classification      |\n|  96 | imppres/implicature_gradable_adjective/prag                          | tasksource/imppres                           | implicature_gradable_adjective                      | prag            | imppres__prag                                | Classification      |\n|  97 | imppres/implicature_connectives/log                                  | tasksource/imppres                           | implicature_connectives                             | log             | imppres__log                                 | Classification      |\n|  98 | imppres/implicature_modals/log                                       | tasksource/imppres                           | implicature_modals                                  | log             | imppres__log                                 | Classification      |\n|  99 | imppres/implicature_numerals_10_100/log                              | tasksource/imppres                           | implicature_numerals_10_100                         | log             | imppres__log                                 | Classification      |\n| 100 | imppres/implicature_quantifiers/log                                  | tasksource/imppres                           | implicature_quantifiers                             | log             | imppres__log                                 | Classification      |\n| 101 | imppres/implicature_numerals_2_3/log                                 | tasksource/imppres                           | implicature_numerals_2_3                            | log             | imppres__log                                 | Classification      |\n| 102 | imppres/implicature_gradable_adjective/log                           | tasksource/imppres                           | implicature_gradable_adjective                      | log             | imppres__log                                 | Classification      |\n| 103 | imppres/implicature_gradable_verb/log                                | tasksource/imppres                           | implicature_gradable_verb                           | log             | imppres__log                                 | Classification      |\n| 104 | hlgd                                                                 | hlgd                                         |                                                     |                 | hlgd                                         | Classification      |\n| 105 | paws/labeled_final                                                   | paws                                         | labeled_final                                       |                 | paws___labeled_final                         | Classification      |\n| 106 | paws/labeled_swap                                                    | paws                                         | labeled_swap                                        |                 | paws___labeled_swap                          | Classification      |\n| 107 | medical_questions_pairs                                              | medical_questions_pairs                      |                                                     |                 | medical_questions_pairs                      | Classification      |\n| 108 | conll2003/pos_tags                                                   | conll2003                                    |                                                     | pos_tags        | conll2003__pos_tags                          | TokenClassification |\n| 109 | conll2003/chunk_tags                                                 | conll2003                                    |                                                     | chunk_tags      | conll2003__chunk_tags                        | TokenClassification |\n| 110 | conll2003/ner_tags                                                   | conll2003                                    |                                                     | ner_tags        | conll2003__ner_tags                          | TokenClassification |\n| 111 | model-written-evals                                                  | Anthropic/model-written-evals                |                                                     |                 | model_written_evals                          | MultipleChoice      |\n| 112 | truthful_qa/multiple_choice                                          | truthful_qa                                  | multiple_choice                                     |                 | truthful_qa___multiple_choice                | MultipleChoice      |\n| 113 | fig-qa                                                               | nightingal3/fig-qa                           |                                                     |                 | fig_qa                                       | MultipleChoice      |\n| 114 | bigbench/conceptual_combinations                                     | tasksource/bigbench                          | conceptual_combinations                             |                 | bigbench                                     | MultipleChoice      |\n| 115 | bigbench/logical_sequence                                            | tasksource/bigbench                          | logical_sequence                                    |                 | bigbench                                     | MultipleChoice      |\n| 116 | bigbench/metaphor_understanding                                      | tasksource/bigbench                          | metaphor_understanding                              |                 | bigbench                                     | MultipleChoice      |\n| 117 | bigbench/identify_odd_metaphor                                       | tasksource/bigbench                          | identify_odd_metaphor                               |                 | bigbench                                     | MultipleChoice      |\n| 118 | bigbench/physical_intuition                                          | tasksource/bigbench                          | physical_intuition                                  |                 | bigbench                                     | MultipleChoice      |\n| 119 | bigbench/english_proverbs                                            | tasksource/bigbench                          | english_proverbs                                    |                 | bigbench                                     | MultipleChoice      |\n| 120 | bigbench/empirical_judgments                                         | tasksource/bigbench                          | empirical_judgments                                 |                 | bigbench                                     | MultipleChoice      |\n| 121 | bigbench/logical_args                                                | tasksource/bigbench                          | logical_args                                        |                 | bigbench                                     | MultipleChoice      |\n| 122 | bigbench/identify_math_theorems                                      | tasksource/bigbench                          | identify_math_theorems                              |                 | bigbench                                     | MultipleChoice      |\n| 123 | bigbench/moral_permissibility                                        | tasksource/bigbench                          | moral_permissibility                                |                 | bigbench                                     | MultipleChoice      |\n| 124 | bigbench/formal_fallacies_syllogisms_negation                        | tasksource/bigbench                          | formal_fallacies_syllogisms_negation                |                 | bigbench                                     | MultipleChoice      |\n| 125 | bigbench/gre_reading_comprehension                                   | tasksource/bigbench                          | gre_reading_comprehension                           |                 | bigbench                                     | MultipleChoice      |\n| 126 | bigbench/suicide_risk                                                | tasksource/bigbench                          | suicide_risk                                        |                 | bigbench                                     | MultipleChoice      |\n| 127 | bigbench/evaluating_information_essentiality                         | tasksource/bigbench                          | evaluating_information_essentiality                 |                 | bigbench                                     | MultipleChoice      |\n| 128 | bigbench/known_unknowns                                              | tasksource/bigbench                          | known_unknowns                                      |                 | bigbench                                     | MultipleChoice      |\n| 129 | bigbench/fact_checker                                                | tasksource/bigbench                          | fact_checker                                        |                 | bigbench                                     | MultipleChoice      |\n| 130 | bigbench/bbq_lite_json                                               | tasksource/bigbench                          | bbq_lite_json                                       |                 | bigbench                                     | MultipleChoice      |\n| 131 | bigbench/hyperbaton                                                  | tasksource/bigbench                          | hyperbaton                                          |                 | bigbench                                     | MultipleChoice      |\n| 132 | bigbench/international_phonetic_alphabet_nli                         | tasksource/bigbench                          | international_phonetic_alphabet_nli                 |                 | bigbench                                     | MultipleChoice      |\n| 133 | bigbench/emojis_emotion_prediction                                   | tasksource/bigbench                          | emojis_emotion_prediction                           |                 | bigbench                                     | MultipleChoice      |\n| 134 | bigbench/analytic_entailment                                         | tasksource/bigbench                          | analytic_entailment                                 |                 | bigbench                                     | MultipleChoice      |\n| 135 | bigbench/presuppositions_as_nli                                      | tasksource/bigbench                          | presuppositions_as_nli                              |                 | bigbench                                     | MultipleChoice      |\n| 136 | bigbench/social_support                                              | tasksource/bigbench                          | social_support                                      |                 | bigbench                                     | MultipleChoice      |\n| 137 | bigbench/crash_blossom                                               | tasksource/bigbench                          | crash_blossom                                       |                 | bigbench                                     | MultipleChoice      |\n| 138 | bigbench/play_dialog_same_or_different                               | tasksource/bigbench                          | play_dialog_same_or_different                       |                 | bigbench                                     | MultipleChoice      |\n| 139 | bigbench/movie_dialog_same_or_different                              | tasksource/bigbench                          | movie_dialog_same_or_different                      |                 | bigbench                                     | MultipleChoice      |\n| 140 | bigbench/phrase_relatedness                                          | tasksource/bigbench                          | phrase_relatedness                                  |                 | bigbench                                     | MultipleChoice      |\n| 141 | bigbench/penguins_in_a_table                                         | tasksource/bigbench                          | penguins_in_a_table                                 |                 | bigbench                                     | MultipleChoice      |\n| 142 | bigbench/human_organs_senses                                         | tasksource/bigbench                          | human_organs_senses                                 |                 | bigbench                                     | MultipleChoice      |\n| 143 | bigbench/logical_deduction                                           | tasksource/bigbench                          | logical_deduction                                   |                 | bigbench                                     | MultipleChoice      |\n| 144 | bigbench/intent_recognition                                          | tasksource/bigbench                          | intent_recognition                                  |                 | bigbench                                     | MultipleChoice      |\n| 145 | bigbench/strategyqa                                                  | tasksource/bigbench                          | strategyqa                                          |                 | bigbench                                     | MultipleChoice      |\n| 146 | bigbench/discourse_marker_prediction                                 | tasksource/bigbench                          | discourse_marker_prediction                         |                 | bigbench                                     | MultipleChoice      |\n| 147 | bigbench/metaphor_boolean                                            | tasksource/bigbench                          | metaphor_boolean                                    |                 | bigbench                                     | MultipleChoice      |\n| 148 | bigbench/sports_understanding                                        | tasksource/bigbench                          | sports_understanding                                |                 | bigbench                                     | MultipleChoice      |\n| 149 | bigbench/mnist_ascii                                                 | tasksource/bigbench                          | mnist_ascii                                         |                 | bigbench                                     | MultipleChoice      |\n| 150 | bigbench/authorship_verification                                     | tasksource/bigbench                          | authorship_verification                             |                 | bigbench                                     | MultipleChoice      |\n| 151 | bigbench/question_selection                                          | tasksource/bigbench                          | question_selection                                  |                 | bigbench                                     | MultipleChoice      |\n| 152 | bigbench/code_line_description                                       | tasksource/bigbench                          | code_line_description                               |                 | bigbench                                     | MultipleChoice      |\n| 153 | bigbench/similarities_abstraction                                    | tasksource/bigbench                          | similarities_abstraction                            |                 | bigbench                                     | MultipleChoice      |\n| 154 | bigbench/simple_ethical_questions                                    | tasksource/bigbench                          | simple_ethical_questions                            |                 | bigbench                                     | MultipleChoice      |\n| 155 | bigbench/date_understanding                                          | tasksource/bigbench                          | date_understanding                                  |                 | bigbench                                     | MultipleChoice      |\n| 156 | bigbench/novel_concepts                                              | tasksource/bigbench                          | novel_concepts                                      |                 | bigbench                                     | MultipleChoice      |\n| 157 | bigbench/hindu_knowledge                                             | tasksource/bigbench                          | hindu_knowledge                                     |                 | bigbench                                     | MultipleChoice      |\n| 158 | bigbench/vitaminc_fact_verification                                  | tasksource/bigbench                          | vitaminc_fact_verification                          |                 | bigbench                                     | MultipleChoice      |\n| 159 | bigbench/tracking_shuffled_objects                                   | tasksource/bigbench                          | tracking_shuffled_objects                           |                 | bigbench                                     | MultipleChoice      |\n| 160 | bigbench/logical_fallacy_detection                                   | tasksource/bigbench                          | logical_fallacy_detection                           |                 | bigbench                                     | MultipleChoice      |\n| 161 | bigbench/dyck_languages                                              | tasksource/bigbench                          | dyck_languages                                      |                 | bigbench                                     | MultipleChoice      |\n| 162 | bigbench/geometric_shapes                                            | tasksource/bigbench                          | geometric_shapes                                    |                 | bigbench                                     | MultipleChoice      |\n| 163 | bigbench/crass_ai                                                    | tasksource/bigbench                          | crass_ai                                            |                 | bigbench                                     | MultipleChoice      |\n| 164 | bigbench/checkmate_in_one                                            | tasksource/bigbench                          | checkmate_in_one                                    |                 | bigbench                                     | MultipleChoice      |\n| 165 | bigbench/causal_judgment                                             | tasksource/bigbench                          | causal_judgment                                     |                 | bigbench                                     | MultipleChoice      |\n| 166 | bigbench/elementary_math_qa                                          | tasksource/bigbench                          | elementary_math_qa                                  |                 | bigbench                                     | MultipleChoice      |\n| 167 | bigbench/mathematical_induction                                      | tasksource/bigbench                          | mathematical_induction                              |                 | bigbench                                     | MultipleChoice      |\n| 168 | bigbench/fantasy_reasoning                                           | tasksource/bigbench                          | fantasy_reasoning                                   |                 | bigbench                                     | MultipleChoice      |\n| 169 | bigbench/anachronisms                                                | tasksource/bigbench                          | anachronisms                                        |                 | bigbench                                     | MultipleChoice      |\n| 170 | bigbench/disambiguation_qa                                           | tasksource/bigbench                          | disambiguation_qa                                   |                 | bigbench                                     | MultipleChoice      |\n| 171 | bigbench/understanding_fables                                        | tasksource/bigbench                          | understanding_fables                                |                 | bigbench                                     | MultipleChoice      |\n| 172 | bigbench/key_value_maps                                              | tasksource/bigbench                          | key_value_maps                                      |                 | bigbench                                     | MultipleChoice      |\n| 173 | bigbench/arithmetic                                                  | tasksource/bigbench                          | arithmetic                                          |                 | bigbench                                     | MultipleChoice      |\n| 174 | bigbench/logic_grid_puzzle                                           | tasksource/bigbench                          | logic_grid_puzzle                                   |                 | bigbench                                     | MultipleChoice      |\n| 175 | bigbench/snarks                                                      | tasksource/bigbench                          | snarks                                              |                 | bigbench                                     | MultipleChoice      |\n| 176 | bigbench/movie_recommendation                                        | tasksource/bigbench                          | movie_recommendation                                |                 | bigbench                                     | MultipleChoice      |\n| 177 | bigbench/color                                                       | tasksource/bigbench                          | color                                               |                 | bigbench                                     | MultipleChoice      |\n| 178 | bigbench/undo_permutation                                            | tasksource/bigbench                          | undo_permutation                                    |                 | bigbench                                     | MultipleChoice      |\n| 179 | bigbench/contextual_parametric_knowledge_conflicts                   | tasksource/bigbench                          | contextual_parametric_knowledge_conflicts           |                 | bigbench                                     | MultipleChoice      |\n| 180 | bigbench/temporal_sequences                                          | tasksource/bigbench                          | temporal_sequences                                  |                 | bigbench                                     | MultipleChoice      |\n| 181 | bigbench/misconceptions                                              | tasksource/bigbench                          | misconceptions                                      |                 | bigbench                                     | MultipleChoice      |\n| 182 | bigbench/analogical_similarity                                       | tasksource/bigbench                          | analogical_similarity                               |                 | bigbench                                     | MultipleChoice      |\n| 183 | bigbench/timedial                                                    | tasksource/bigbench                          | timedial                                            |                 | bigbench                                     | MultipleChoice      |\n| 184 | bigbench/winowhy                                                     | tasksource/bigbench                          | winowhy                                             |                 | bigbench                                     | MultipleChoice      |\n| 185 | bigbench/social_iqa                                                  | tasksource/bigbench                          | social_iqa                                          |                 | bigbench                                     | MultipleChoice      |\n| 186 | bigbench/riddle_sense                                                | tasksource/bigbench                          | riddle_sense                                        |                 | bigbench                                     | MultipleChoice      |\n| 187 | bigbench/irony_identification                                        | tasksource/bigbench                          | irony_identification                                |                 | bigbench                                     | MultipleChoice      |\n| 188 | bigbench/goal_step_wikihow                                           | tasksource/bigbench                          | goal_step_wikihow                                   |                 | bigbench                                     | MultipleChoice      |\n| 189 | bigbench/symbol_interpretation                                       | tasksource/bigbench                          | symbol_interpretation                               |                 | bigbench                                     | MultipleChoice      |\n| 190 | bigbench/hhh_alignment                                               | tasksource/bigbench                          | hhh_alignment                                       |                 | bigbench                                     | MultipleChoice      |\n| 191 | bigbench/cs_algorithms                                               | tasksource/bigbench                          | cs_algorithms                                       |                 | bigbench                                     | MultipleChoice      |\n| 192 | bigbench/emoji_movie                                                 | tasksource/bigbench                          | emoji_movie                                         |                 | bigbench                                     | MultipleChoice      |\n| 193 | bigbench/abstract_narrative_understanding                            | tasksource/bigbench                          | abstract_narrative_understanding                    |                 | bigbench                                     | MultipleChoice      |\n| 194 | bigbench/navigate                                                    | tasksource/bigbench                          | navigate                                            |                 | bigbench                                     | MultipleChoice      |\n| 195 | bigbench/cifar10_classification                                      | tasksource/bigbench                          | cifar10_classification                              |                 | bigbench                                     | MultipleChoice      |\n| 196 | bigbench/implicit_relations                                          | tasksource/bigbench                          | implicit_relations                                  |                 | bigbench                                     | MultipleChoice      |\n| 197 | bigbench/real_or_fake_text                                           | tasksource/bigbench                          | real_or_fake_text                                   |                 | bigbench                                     | MultipleChoice      |\n| 198 | bigbench/unit_interpretation                                         | tasksource/bigbench                          | unit_interpretation                                 |                 | bigbench                                     | MultipleChoice      |\n| 199 | bigbench/reasoning_about_colored_objects                             | tasksource/bigbench                          | reasoning_about_colored_objects                     |                 | bigbench                                     | MultipleChoice      |\n| 200 | bigbench/nonsense_words_grammar                                      | tasksource/bigbench                          | nonsense_words_grammar                              |                 | bigbench                                     | MultipleChoice      |\n| 201 | bigbench/salient_translation_error_detection                         | tasksource/bigbench                          | salient_translation_error_detection                 |                 | bigbench                                     | MultipleChoice      |\n| 202 | bigbench/implicatures                                                | tasksource/bigbench                          | implicatures                                        |                 | bigbench                                     | MultipleChoice      |\n| 203 | bigbench/entailed_polarity                                           | tasksource/bigbench                          | entailed_polarity                                   |                 | bigbench                                     | MultipleChoice      |\n| 204 | bigbench/physics                                                     | tasksource/bigbench                          | physics                                             |                 | bigbench                                     | MultipleChoice      |\n| 205 | bigbench/cause_and_effect                                            | tasksource/bigbench                          | cause_and_effect                                    |                 | bigbench                                     | MultipleChoice      |\n| 206 | bigbench/strange_stories                                             | tasksource/bigbench                          | strange_stories                                     |                 | bigbench                                     | MultipleChoice      |\n| 207 | bigbench/epistemic_reasoning                                         | tasksource/bigbench                          | epistemic_reasoning                                 |                 | bigbench                                     | MultipleChoice      |\n| 208 | bigbench/general_knowledge                                           | tasksource/bigbench                          | general_knowledge                                   |                 | bigbench                                     | MultipleChoice      |\n| 209 | bigbench/odd_one_out                                                 | tasksource/bigbench                          | odd_one_out                                         |                 | bigbench                                     | MultipleChoice      |\n| 210 | bigbench/figure_of_speech_detection                                  | tasksource/bigbench                          | figure_of_speech_detection                          |                 | bigbench                                     | MultipleChoice      |\n| 211 | bigbench/ruin_names                                                  | tasksource/bigbench                          | ruin_names                                          |                 | bigbench                                     | MultipleChoice      |\n| 212 | bigbench/sentence_ambiguity                                          | tasksource/bigbench                          | sentence_ambiguity                                  |                 | bigbench                                     | MultipleChoice      |\n| 213 | bigbench/dark_humor_detection                                        | tasksource/bigbench                          | dark_humor_detection                                |                 | bigbench                                     | MultipleChoice      |\n| 214 | blimp/wh_vs_that_with_gap                                            | blimp                                        | wh_vs_that_with_gap                                 |                 | blimp_hard                                   | MultipleChoice      |\n| 215 | blimp/sentential_negation_npi_scope                                  | blimp                                        | sentential_negation_npi_scope                       |                 | blimp_hard                                   | MultipleChoice      |\n| 216 | blimp/superlative_quantifiers_1                                      | blimp                                        | superlative_quantifiers_1                           |                 | blimp_hard                                   | MultipleChoice      |\n| 217 | blimp/wh_questions_object_gap                                        | blimp                                        | wh_questions_object_gap                             |                 | blimp_hard                                   | MultipleChoice      |\n| 218 | blimp/coordinate_structure_constraint_object_extraction              | blimp                                        | coordinate_structure_constraint_object_extraction   |                 | blimp_hard                                   | MultipleChoice      |\n| 219 | blimp/coordinate_structure_constraint_complex_left_branch            | blimp                                        | coordinate_structure_constraint_complex_left_branch |                 | blimp_hard                                   | MultipleChoice      |\n| 220 | blimp/existential_there_quantifiers_2                                | blimp                                        | existential_there_quantifiers_2                     |                 | blimp_hard                                   | MultipleChoice      |\n| 221 | blimp/drop_argument                                                  | blimp                                        | drop_argument                                       |                 | blimp_hard                                   | MultipleChoice      |\n| 222 | blimp/wh_questions_subject_gap_long_distance                         | blimp                                        | wh_questions_subject_gap_long_distance              |                 | blimp_hard                                   | MultipleChoice      |\n| 223 | blimp/matrix_question_npi_licensor_present                           | blimp                                        | matrix_question_npi_licensor_present                |                 | blimp_hard                                   | MultipleChoice      |\n| 224 | blimp/principle_A_c_command                                          | blimp                                        | principle_A_c_command                               |                 | blimp_hard                                   | MultipleChoice      |\n| 225 | blimp/animate_subject_passive                                        | blimp                                        | animate_subject_passive                             |                 | blimp_hard                                   | MultipleChoice      |\n| 226 | blimp/tough_vs_raising_1                                             | blimp                                        | tough_vs_raising_1                                  |                 | blimp_hard                                   | MultipleChoice      |\n| 227 | blimp/npi_present_1                                                  | blimp                                        | npi_present_1                                       |                 | blimp_hard                                   | MultipleChoice      |\n| 228 | blimp/sentential_subject_island                                      | blimp                                        | sentential_subject_island                           |                 | blimp_hard                                   | MultipleChoice      |\n| 229 | blimp/npi_present_2                                                  | blimp                                        | npi_present_2                                       |                 | blimp_hard                                   | MultipleChoice      |\n| 230 | blimp/inchoative                                                     | blimp                                        | inchoative                                          |                 | blimp_hard                                   | MultipleChoice      |\n| 231 | blimp/wh_vs_that_with_gap_long_distance                              | blimp                                        | wh_vs_that_with_gap_long_distance                   |                 | blimp_hard                                   | MultipleChoice      |\n| 232 | blimp/principle_A_reconstruction                                     | blimp                                        | principle_A_reconstruction                          |                 | blimp_hard                                   | MultipleChoice      |\n| 233 | blimp/complex_NP_island                                              | blimp                                        | complex_NP_island                                   |                 | blimp_hard                                   | MultipleChoice      |\n| 234 | blimp/left_branch_island_echo_question                               | blimp                                        | left_branch_island_echo_question                    |                 | blimp_hard                                   | MultipleChoice      |\n| 235 | blimp/principle_A_domain_2                                           | blimp                                        | principle_A_domain_2                                |                 | blimp_hard                                   | MultipleChoice      |\n| 236 | cos_e/v1.0                                                           | cos_e                                        | v1.0                                                |                 | cos_e                                        | MultipleChoice      |\n| 237 | cosmos_qa                                                            | cosmos_qa                                    |                                                     |                 | cosmos_qa                                    | MultipleChoice      |\n| 238 | dream                                                                | dream                                        |                                                     |                 | dream                                        | MultipleChoice      |\n| 239 | openbookqa                                                           | openbookqa                                   |                                                     |                 | openbookqa                                   | MultipleChoice      |\n| 240 | qasc                                                                 | qasc                                         |                                                     |                 | qasc                                         | MultipleChoice      |\n| 241 | quartz                                                               | quartz                                       |                                                     |                 | quartz                                       | MultipleChoice      |\n| 242 | quail                                                                | quail                                        |                                                     |                 | quail                                        | MultipleChoice      |\n| 243 | head_qa/en                                                           | head_qa                                      | en                                                  |                 | head_qa___en                                 | MultipleChoice      |\n| 244 | sciq                                                                 | sciq                                         |                                                     |                 | sciq                                         | MultipleChoice      |\n| 245 | social_i_qa                                                          | social_i_qa                                  |                                                     |                 | social_i_qa                                  | MultipleChoice      |\n| 246 | wiki_hop/original                                                    | wiki_hop                                     | original                                            |                 | wiki_hop___original                          | MultipleChoice      |\n| 247 | wiqa                                                                 | wiqa                                         |                                                     |                 | wiqa                                         | MultipleChoice      |\n| 248 | piqa                                                                 | piqa                                         |                                                     |                 | piqa                                         | MultipleChoice      |\n| 249 | hellaswag                                                            | hellaswag                                    |                                                     |                 | hellaswag                                    | MultipleChoice      |\n| 250 | super_glue/copa                                                      | super_glue                                   | copa                                                |                 | super_glue___copa                            | MultipleChoice      |\n| 251 | balanced-copa                                                        | pkavumba/balanced-copa                       |                                                     |                 | balanced_copa                                | MultipleChoice      |\n| 252 | e-CARE                                                               | 12ml/e-CARE                                  |                                                     |                 | e_care                                       | MultipleChoice      |\n| 253 | art                                                                  | art                                          |                                                     |                 | art                                          | MultipleChoice      |\n| 254 | mmlu/marketing                                                       | tasksource/mmlu                              | marketing                                           |                 | mmlu                                         | MultipleChoice      |\n| 255 | mmlu/high_school_government_and_politics                             | tasksource/mmlu                              | high_school_government_and_politics                 |                 | mmlu                                         | MultipleChoice      |\n| 256 | mmlu/high_school_macroeconomics                                      | tasksource/mmlu                              | high_school_macroeconomics                          |                 | mmlu                                         | MultipleChoice      |\n| 257 | mmlu/medical_genetics                                                | tasksource/mmlu                              | medical_genetics                                    |                 | mmlu                                         | MultipleChoice      |\n| 258 | mmlu/miscellaneous                                                   | tasksource/mmlu                              | miscellaneous                                       |                 | mmlu                                         | MultipleChoice      |\n| 259 | mmlu/moral_disputes                                                  | tasksource/mmlu                              | moral_disputes                                      |                 | mmlu                                         | MultipleChoice      |\n| 260 | mmlu/moral_scenarios                                                 | tasksource/mmlu                              | moral_scenarios                                     |                 | mmlu                                         | MultipleChoice      |\n| 261 | mmlu/nutrition                                                       | tasksource/mmlu                              | nutrition                                           |                 | mmlu                                         | MultipleChoice      |\n| 262 | mmlu/philosophy                                                      | tasksource/mmlu                              | philosophy                                          |                 | mmlu                                         | MultipleChoice      |\n| 263 | mmlu/professional_law                                                | tasksource/mmlu                              | professional_law                                    |                 | mmlu                                         | MultipleChoice      |\n| 264 | mmlu/professional_medicine                                           | tasksource/mmlu                              | professional_medicine                               |                 | mmlu                                         | MultipleChoice      |\n| 265 | mmlu/professional_psychology                                         | tasksource/mmlu                              | professional_psychology                             |                 | mmlu                                         | MultipleChoice      |\n| 266 | mmlu/public_relations                                                | tasksource/mmlu                              | public_relations                                    |                 | mmlu                                         | MultipleChoice      |\n| 267 | mmlu/security_studies                                                | tasksource/mmlu                              | security_studies                                    |                 | mmlu                                         | MultipleChoice      |\n| 268 | mmlu/sociology                                                       | tasksource/mmlu                              | sociology                                           |                 | mmlu                                         | MultipleChoice      |\n| 269 | mmlu/us_foreign_policy                                               | tasksource/mmlu                              | us_foreign_policy                                   |                 | mmlu                                         | MultipleChoice      |\n| 270 | mmlu/anatomy                                                         | tasksource/mmlu                              | anatomy                                             |                 | mmlu                                         | MultipleChoice      |\n| 271 | mmlu/astronomy                                                       | tasksource/mmlu                              | astronomy                                           |                 | mmlu                                         | MultipleChoice      |\n| 272 | mmlu/business_ethics                                                 | tasksource/mmlu                              | business_ethics                                     |                 | mmlu                                         | MultipleChoice      |\n| 273 | mmlu/jurisprudence                                                   | tasksource/mmlu                              | jurisprudence                                       |                 | mmlu                                         | MultipleChoice      |\n| 274 | mmlu/logical_fallacies                                               | tasksource/mmlu                              | logical_fallacies                                   |                 | mmlu                                         | MultipleChoice      |\n| 275 | mmlu/machine_learning                                                | tasksource/mmlu                              | machine_learning                                    |                 | mmlu                                         | MultipleChoice      |\n| 276 | mmlu/management                                                      | tasksource/mmlu                              | management                                          |                 | mmlu                                         | MultipleChoice      |\n| 277 | mmlu/econometrics                                                    | tasksource/mmlu                              | econometrics                                        |                 | mmlu                                         | MultipleChoice      |\n| 278 | mmlu/college_medicine                                                | tasksource/mmlu                              | college_medicine                                    |                 | mmlu                                         | MultipleChoice      |\n| 279 | mmlu/college_physics                                                 | tasksource/mmlu                              | college_physics                                     |                 | mmlu                                         | MultipleChoice      |\n| 280 | mmlu/computer_security                                               | tasksource/mmlu                              | computer_security                                   |                 | mmlu                                         | MultipleChoice      |\n| 281 | mmlu/conceptual_physics                                              | tasksource/mmlu                              | conceptual_physics                                  |                 | mmlu                                         | MultipleChoice      |\n| 282 | mmlu/electrical_engineering                                          | tasksource/mmlu                              | electrical_engineering                              |                 | mmlu                                         | MultipleChoice      |\n| 283 | mmlu/human_sexuality                                                 | tasksource/mmlu                              | human_sexuality                                     |                 | mmlu                                         | MultipleChoice      |\n| 284 | mmlu/international_law                                               | tasksource/mmlu                              | international_law                                   |                 | mmlu                                         | MultipleChoice      |\n| 285 | mmlu/elementary_mathematics                                          | tasksource/mmlu                              | elementary_mathematics                              |                 | mmlu                                         | MultipleChoice      |\n| 286 | mmlu/prehistory                                                      | tasksource/mmlu                              | prehistory                                          |                 | mmlu                                         | MultipleChoice      |\n| 287 | mmlu/high_school_world_history                                       | tasksource/mmlu                              | high_school_world_history                           |                 | mmlu                                         | MultipleChoice      |\n| 288 | mmlu/human_aging                                                     | tasksource/mmlu                              | human_aging                                         |                 | mmlu                                         | MultipleChoice      |\n| 289 | mmlu/abstract_algebra                                                | tasksource/mmlu                              | abstract_algebra                                    |                 | mmlu                                         | MultipleChoice      |\n| 290 | mmlu/clinical_knowledge                                              | tasksource/mmlu                              | clinical_knowledge                                  |                 | mmlu                                         | MultipleChoice      |\n| 291 | mmlu/college_biology                                                 | tasksource/mmlu                              | college_biology                                     |                 | mmlu                                         | MultipleChoice      |\n| 292 | mmlu/college_chemistry                                               | tasksource/mmlu                              | college_chemistry                                   |                 | mmlu                                         | MultipleChoice      |\n| 293 | mmlu/virology                                                        | tasksource/mmlu                              | virology                                            |                 | mmlu                                         | MultipleChoice      |\n| 294 | mmlu/world_religions                                                 | tasksource/mmlu                              | world_religions                                     |                 | mmlu                                         | MultipleChoice      |\n| 295 | mmlu/professional_accounting                                         | tasksource/mmlu                              | professional_accounting                             |                 | mmlu                                         | MultipleChoice      |\n| 296 | mmlu/global_facts                                                    | tasksource/mmlu                              | global_facts                                        |                 | mmlu                                         | MultipleChoice      |\n| 297 | mmlu/high_school_biology                                             | tasksource/mmlu                              | high_school_biology                                 |                 | mmlu                                         | MultipleChoice      |\n| 298 | mmlu/high_school_chemistry                                           | tasksource/mmlu                              | high_school_chemistry                               |                 | mmlu                                         | MultipleChoice      |\n| 299 | mmlu/high_school_european_history                                    | tasksource/mmlu                              | high_school_european_history                        |                 | mmlu                                         | MultipleChoice      |\n| 300 | mmlu/formal_logic                                                    | tasksource/mmlu                              | formal_logic                                        |                 | mmlu                                         | MultipleChoice      |\n| 301 | mmlu/high_school_us_history                                          | tasksource/mmlu                              | high_school_us_history                              |                 | mmlu                                         | MultipleChoice      |\n| 302 | mmlu/high_school_statistics                                          | tasksource/mmlu                              | high_school_statistics                              |                 | mmlu                                         | MultipleChoice      |\n| 303 | mmlu/high_school_psychology                                          | tasksource/mmlu                              | high_school_psychology                              |                 | mmlu                                         | MultipleChoice      |\n| 304 | mmlu/high_school_physics                                             | tasksource/mmlu                              | high_school_physics                                 |                 | mmlu                                         | MultipleChoice      |\n| 305 | mmlu/high_school_microeconomics                                      | tasksource/mmlu                              | high_school_microeconomics                          |                 | mmlu                                         | MultipleChoice      |\n| 306 | mmlu/high_school_mathematics                                         | tasksource/mmlu                              | high_school_mathematics                             |                 | mmlu                                         | MultipleChoice      |\n| 307 | mmlu/college_mathematics                                             | tasksource/mmlu                              | college_mathematics                                 |                 | mmlu                                         | MultipleChoice      |\n| 308 | mmlu/college_computer_science                                        | tasksource/mmlu                              | college_computer_science                            |                 | mmlu                                         | MultipleChoice      |\n| 309 | mmlu/high_school_geography                                           | tasksource/mmlu                              | high_school_geography                               |                 | mmlu                                         | MultipleChoice      |\n| 310 | mmlu/high_school_computer_science                                    | tasksource/mmlu                              | high_school_computer_science                        |                 | mmlu                                         | MultipleChoice      |\n| 311 | winogrande/winogrande_xl                                             | winogrande                                   | winogrande_xl                                       |                 | winogrande                                   | MultipleChoice      |\n| 312 | codah/codah                                                          | codah                                        | codah                                               |                 | codah                                        | MultipleChoice      |\n| 313 | ai2_arc/ARC-Challenge/challenge                                      | ai2_arc                                      | ARC-Challenge                                       | challenge       | ai2_arc__challenge                           | MultipleChoice      |\n| 314 | ai2_arc/ARC-Easy/challenge                                           | ai2_arc                                      | ARC-Easy                                            | challenge       | ai2_arc__challenge                           | MultipleChoice      |\n| 315 | definite_pronoun_resolution                                          | definite_pronoun_resolution                  |                                                     |                 | definite_pronoun_resolution                  | MultipleChoice      |\n| 316 | swag/regular                                                         | swag                                         | regular                                             |                 | swag___regular                               | MultipleChoice      |\n| 317 | math_qa                                                              | math_qa                                      |                                                     |                 | math_qa                                      | MultipleChoice      |\n| 318 | glue/cola                                                            | glue                                         | cola                                                |                 | glue___cola                                  | Classification      |\n| 319 | glue/sst2                                                            | glue                                         | sst2                                                |                 | glue___sst2                                  | Classification      |\n| 320 | utilitarianism                                                       | metaeval/utilitarianism                      |                                                     |                 | utilitarianism                               | Classification      |\n| 321 | amazon_counterfactual/en                                             | mteb/amazon_counterfactual                   | en                                                  |                 | amazon_counterfactual                        | Classification      |\n| 322 | insincere-questions                                                  | SetFit/insincere-questions                   |                                                     |                 | insincere_questions                          | Classification      |\n| 323 | toxic_conversations                                                  | SetFit/toxic_conversations                   |                                                     |                 | toxic_conversations                          | Classification      |\n| 324 | TuringBench                                                          | turingbench/TuringBench                      |                                                     |                 | turingbench                                  | Classification      |\n| 325 | trec                                                                 | trec                                         |                                                     |                 | trec                                         | Classification      |\n| 326 | vitaminc                                                             | tals/vitaminc                                |                                                     |                 | tals_vitaminc                                | Classification      |\n| 327 | hope_edi/english                                                     | hope_edi                                     | english                                             |                 | hope_edi                                     | Classification      |\n| 328 | rumoureval_2019/RumourEval2019                                       | strombergnlp/rumoureval_2019                 | RumourEval2019                                      |                 | rumoureval_2019                              | Classification      |\n| 329 | ethos/binary                                                         | ethos                                        | binary                                              |                 | ethos___binary                               | Classification      |\n| 330 | ethos/multilabel                                                     | ethos                                        | multilabel                                          |                 | ethos___multilabel                           | Classification      |\n| 331 | tweet_eval/irony                                                     | tweet_eval                                   | irony                                               |                 | tweet_eval                                   | Classification      |\n| 332 | tweet_eval/sentiment                                                 | tweet_eval                                   | sentiment                                           |                 | tweet_eval                                   | Classification      |\n| 333 | tweet_eval/emotion                                                   | tweet_eval                                   | emotion                                             |                 | tweet_eval                                   | Classification      |\n| 334 | tweet_eval/emoji                                                     | tweet_eval                                   | emoji                                               |                 | tweet_eval                                   | Classification      |\n| 335 | tweet_eval/hate                                                      | tweet_eval                                   | hate                                                |                 | tweet_eval                                   | Classification      |\n| 336 | tweet_eval/offensive                                                 | tweet_eval                                   | offensive                                           |                 | tweet_eval                                   | Classification      |\n| 337 | tweet_eval/stance_abortion                                           | tweet_eval                                   | stance_abortion                                     |                 | tweet_eval_abortion                          | Classification      |\n| 338 | tweet_eval/stance_atheism                                            | tweet_eval                                   | stance_atheism                                      |                 | tweet_eval_atheism                           | Classification      |\n| 339 | tweet_eval/stance_climate                                            | tweet_eval                                   | stance_climate                                      |                 | tweet_eval_climate                           | Classification      |\n| 340 | tweet_eval/stance_feminist                                           | tweet_eval                                   | stance_feminist                                     |                 | tweet_eval_feminist                          | Classification      |\n| 341 | tweet_eval/stance_hillary                                            | tweet_eval                                   | stance_hillary                                      |                 | tweet_eval_hillary                           | Classification      |\n| 342 | discovery/discovery                                                  | discovery                                    | discovery                                           |                 | discovery                                    | Classification      |\n| 343 | pragmeval/squinky-formality                                          | pragmeval                                    | squinky-formality                                   |                 | pragmeval_1                                  | Classification      |\n| 344 | pragmeval/switchboard                                                | pragmeval                                    | switchboard                                         |                 | pragmeval_1                                  | Classification      |\n| 345 | pragmeval/mrda                                                       | pragmeval                                    | mrda                                                |                 | pragmeval_1                                  | Classification      |\n| 346 | pragmeval/squinky-informativeness                                    | pragmeval                                    | squinky-informativeness                             |                 | pragmeval_1                                  | Classification      |\n| 347 | pragmeval/squinky-implicature                                        | pragmeval                                    | squinky-implicature                                 |                 | pragmeval_1                                  | Classification      |\n| 348 | pragmeval/emobank-valence                                            | pragmeval                                    | emobank-valence                                     |                 | pragmeval_1                                  | Classification      |\n| 349 | pragmeval/emobank-dominance                                          | pragmeval                                    | emobank-dominance                                   |                 | pragmeval_1                                  | Classification      |\n| 350 | pragmeval/verifiability                                              | pragmeval                                    | verifiability                                       |                 | pragmeval_1                                  | Classification      |\n| 351 | pragmeval/emobank-arousal                                            | pragmeval                                    | emobank-arousal                                     |                 | pragmeval_1                                  | Classification      |\n| 352 | pragmeval/persuasiveness-specificity                                 | pragmeval                                    | persuasiveness-specificity                          |                 | pragmeval_2                                  | Classification      |\n| 353 | pragmeval/persuasiveness-strength                                    | pragmeval                                    | persuasiveness-strength                             |                 | pragmeval_2                                  | Classification      |\n| 354 | pragmeval/sarcasm                                                    | pragmeval                                    | sarcasm                                             |                 | pragmeval_2                                  | Classification      |\n| 355 | pragmeval/stac                                                       | pragmeval                                    | stac                                                |                 | pragmeval_2                                  | Classification      |\n| 356 | pragmeval/pdtb                                                       | pragmeval                                    | pdtb                                                |                 | pragmeval_2                                  | Classification      |\n| 357 | pragmeval/emergent                                                   | pragmeval                                    | emergent                                            |                 | pragmeval_2                                  | Classification      |\n| 358 | pragmeval/gum                                                        | pragmeval                                    | gum                                                 |                 | pragmeval_2                                  | Classification      |\n| 359 | pragmeval/persuasiveness-claimtype                                   | pragmeval                                    | persuasiveness-claimtype                            |                 | pragmeval_2                                  | Classification      |\n| 360 | pragmeval/persuasiveness-eloquence                                   | pragmeval                                    | persuasiveness-eloquence                            |                 | pragmeval_2                                  | Classification      |\n| 361 | pragmeval/persuasiveness-premisetype                                 | pragmeval                                    | persuasiveness-premisetype                          |                 | pragmeval_2                                  | Classification      |\n| 362 | pragmeval/persuasiveness-relevance                                   | pragmeval                                    | persuasiveness-relevance                            |                 | pragmeval_2                                  | Classification      |\n| 363 | silicone/iemocap                                                     | silicone                                     | iemocap                                             |                 | silicone                                     | Classification      |\n| 364 | silicone/dyda_e                                                      | silicone                                     | dyda_e                                              |                 | silicone                                     | Classification      |\n| 365 | silicone/sem                                                         | silicone                                     | sem                                                 |                 | silicone                                     | Classification      |\n| 366 | silicone/dyda_da                                                     | silicone                                     | dyda_da                                             |                 | silicone                                     | Classification      |\n| 367 | silicone/oasis                                                       | silicone                                     | oasis                                               |                 | silicone                                     | Classification      |\n| 368 | silicone/maptask                                                     | silicone                                     | maptask                                             |                 | silicone                                     | Classification      |\n| 369 | silicone/meld_e                                                      | silicone                                     | meld_e                                              |                 | silicone                                     | Classification      |\n| 370 | silicone/meld_s                                                      | silicone                                     | meld_s                                              |                 | silicone                                     | Classification      |\n| 371 | lex_glue/eurlex                                                      | lex_glue                                     | eurlex                                              |                 | lex_glue___eurlex                            | Classification      |\n| 372 | lex_glue/scotus                                                      | lex_glue                                     | scotus                                              |                 | lex_glue___scotus                            | Classification      |\n| 373 | lex_glue/ledgar                                                      | lex_glue                                     | ledgar                                              |                 | lex_glue___ledgar                            | Classification      |\n| 374 | lex_glue/unfair_tos                                                  | lex_glue                                     | unfair_tos                                          |                 | lex_glue___unfair_tos                        | Classification      |\n| 375 | lex_glue/case_hold                                                   | lex_glue                                     | case_hold                                           |                 | lex_glue___case_hold                         | MultipleChoice      |\n| 376 | language-identification                                              | papluca/language-identification              |                                                     |                 | language_identification                      | Classification      |\n| 377 | imdb                                                                 | imdb                                         |                                                     |                 | imdb                                         | Classification      |\n| 378 | rotten_tomatoes                                                      | rotten_tomatoes                              |                                                     |                 | rotten_tomatoes                              | Classification      |\n| 379 | ag_news                                                              | ag_news                                      |                                                     |                 | ag_news                                      | Classification      |\n| 380 | yelp_review_full/yelp_review_full                                    | yelp_review_full                             | yelp_review_full                                    |                 | yelp_review_full                             | Classification      |\n| 381 | financial_phrasebank/sentences_allagree                              | financial_phrasebank                         | sentences_allagree                                  |                 | financial_phrasebank                         | Classification      |\n| 382 | poem_sentiment                                                       | poem_sentiment                               |                                                     |                 | poem_sentiment                               | Classification      |\n| 383 | dbpedia_14/dbpedia_14                                                | dbpedia_14                                   | dbpedia_14                                          |                 | dbpedia_14                                   | Classification      |\n| 384 | amazon_polarity/amazon_polarity                                      | amazon_polarity                              | amazon_polarity                                     |                 | amazon_polarity                              | Classification      |\n| 385 | app_reviews                                                          | app_reviews                                  |                                                     |                 | app_reviews                                  | Classification      |\n| 386 | hate_speech18                                                        | hate_speech18                                |                                                     |                 | hate_speech18                                | Classification      |\n| 387 | sms_spam                                                             | sms_spam                                     |                                                     |                 | sms_spam                                     | Classification      |\n| 388 | humicroedit/subtask-1                                                | humicroedit                                  | subtask-1                                           |                 | humicroedit___subtask_1                      | Classification      |\n| 389 | humicroedit/subtask-2                                                | humicroedit                                  | subtask-2                                           |                 | humicroedit___subtask_2                      | Classification      |\n| 390 | snips_built_in_intents                                               | snips_built_in_intents                       |                                                     |                 | snips_built_in_intents                       | Classification      |\n| 391 | hate_speech_offensive                                                | hate_speech_offensive                        |                                                     |                 | hate_speech_offensive                        | Classification      |\n| 392 | yahoo_answers_topics                                                 | yahoo_answers_topics                         |                                                     |                 | yahoo_answers_topics                         | Classification      |\n| 393 | stackoverflow-questions                                              | pacovaldez/stackoverflow-questions           |                                                     |                 | stackoverflow_questions                      | Classification      |\n| 394 | hyperpartisan_news                                                   | zapsdcn/hyperpartisan_news                   |                                                     |                 | hyperpartisan_news                           | Classification      |\n| 395 | sciie                                                                | zapsdcn/sciie                                |                                                     |                 | scierc                                       | Classification      |\n| 396 | citation_intent                                                      | zapsdcn/citation_intent                      |                                                     |                 | citation_intent                              | Classification      |\n| 397 | go_emotions/simplified                                               | go_emotions                                  | simplified                                          |                 | go_emotions___simplified                     | Classification      |\n| 398 | scicite                                                              | allenai/scicite                              |                                                     |                 | scicite                                      | Classification      |\n| 399 | liar                                                                 | liar                                         |                                                     |                 | liar                                         | Classification      |\n| 400 | lexical_relation_classification/ROOT09                               | relbert/lexical_relation_classification      | ROOT09                                              |                 | relbert_lexical_relation_classification      | Classification      |\n| 401 | lexical_relation_classification/K&H+N                                | relbert/lexical_relation_classification      | K&H+N                                               |                 | relbert_lexical_relation_classification      | Classification      |\n| 402 | lexical_relation_classification/CogALexV                             | relbert/lexical_relation_classification      | CogALexV                                            |                 | relbert_lexical_relation_classification      | Classification      |\n| 403 | lexical_relation_classification/BLESS                                | relbert/lexical_relation_classification      | BLESS                                               |                 | relbert_lexical_relation_classification      | Classification      |\n| 404 | lexical_relation_classification/EVALution                            | relbert/lexical_relation_classification      | EVALution                                           |                 | relbert_lexical_relation_classification      | Classification      |\n| 405 | linguisticprobing/coordination_inversion                             | tasksource/linguisticprobing                 | coordination_inversion                              |                 | linguisticprobing                            | Classification      |\n| 406 | linguisticprobing/top_constituents                                   | tasksource/linguisticprobing                 | top_constituents                                    |                 | linguisticprobing                            | Classification      |\n| 407 | linguisticprobing/bigram_shift                                       | tasksource/linguisticprobing                 | bigram_shift                                        |                 | linguisticprobing                            | Classification      |\n| 408 | linguisticprobing/odd_man_out                                        | tasksource/linguisticprobing                 | odd_man_out                                         |                 | linguisticprobing                            | Classification      |\n| 409 | linguisticprobing/subj_number                                        | tasksource/linguisticprobing                 | subj_number                                         |                 | linguisticprobing                            | Classification      |\n| 410 | linguisticprobing/tree_depth                                         | tasksource/linguisticprobing                 | tree_depth                                          |                 | linguisticprobing                            | Classification      |\n| 411 | linguisticprobing/obj_number                                         | tasksource/linguisticprobing                 | obj_number                                          |                 | linguisticprobing                            | Classification      |\n| 412 | linguisticprobing/past_present                                       | tasksource/linguisticprobing                 | past_present                                        |                 | linguisticprobing                            | Classification      |\n| 413 | linguisticprobing/sentence_length                                    | tasksource/linguisticprobing                 | sentence_length                                     |                 | linguisticprobing                            | Classification      |\n| 414 | crowdflower/airline-sentiment                                        | tasksource/crowdflower                       | airline-sentiment                                   |                 | crowdflower                                  | Classification      |\n| 415 | crowdflower/political-media-bias                                     | tasksource/crowdflower                       | political-media-bias                                |                 | crowdflower                                  | Classification      |\n| 416 | crowdflower/political-media-message                                  | tasksource/crowdflower                       | political-media-message                             |                 | crowdflower                                  | Classification      |\n| 417 | crowdflower/text_emotion                                             | tasksource/crowdflower                       | text_emotion                                        |                 | crowdflower                                  | Classification      |\n| 418 | crowdflower/economic-news                                            | tasksource/crowdflower                       | economic-news                                       |                 | crowdflower                                  | Classification      |\n| 419 | crowdflower/political-media-audience                                 | tasksource/crowdflower                       | political-media-audience                            |                 | crowdflower                                  | Classification      |\n| 420 | crowdflower/corporate-messaging                                      | tasksource/crowdflower                       | corporate-messaging                                 |                 | crowdflower                                  | Classification      |\n| 421 | crowdflower/tweet_global_warming                                     | tasksource/crowdflower                       | tweet_global_warming                                |                 | crowdflower                                  | Classification      |\n| 422 | crowdflower/sentiment_nuclear_power                                  | tasksource/crowdflower                       | sentiment_nuclear_power                             |                 | crowdflower                                  | Classification      |\n| 423 | ethics/commonsense                                                   | metaeval/ethics                              | commonsense                                         |                 | ethics___commonsense                         | Classification      |\n| 424 | ethics/deontology                                                    | metaeval/ethics                              | deontology                                          |                 | ethics___deontology                          | Classification      |\n| 425 | ethics/justice                                                       | metaeval/ethics                              | justice                                             |                 | ethics___justice                             | Classification      |\n| 426 | ethics/virtue                                                        | metaeval/ethics                              | virtue                                              |                 | ethics___virtue                              | Classification      |\n| 427 | emo/emo2019                                                          | emo                                          | emo2019                                             |                 | emo                                          | Classification      |\n| 428 | google_wellformed_query                                              | google_wellformed_query                      |                                                     |                 | google_wellformed_query                      | Classification      |\n| 429 | tweets_hate_speech_detection                                         | tweets_hate_speech_detection                 |                                                     |                 | tweets_hate_speech_detection                 | Classification      |\n| 430 | has_part                                                             | has_part                                     |                                                     |                 | has_part                                     | Classification      |\n| 431 | wnut_17/wnut_17                                                      | wnut_17                                      | wnut_17                                             |                 | wnut_17                                      | TokenClassification |\n| 432 | ncbi_disease/ncbi_disease                                            | ncbi_disease                                 | ncbi_disease                                        |                 | ncbi_disease                                 | TokenClassification |\n| 433 | acronym_identification                                               | acronym_identification                       |                                                     |                 | acronym_identification                       | TokenClassification |\n| 434 | jnlpba/jnlpba                                                        | jnlpba                                       | jnlpba                                              |                 | jnlpba                                       | TokenClassification |\n| 435 | ontonotes_english/SpeedOfMagic--ontonotes_english                    | SpeedOfMagic/ontonotes_english               | SpeedOfMagic--ontonotes_english                     |                 | SpeedOfMagic_ontonotes_english               | TokenClassification |\n| 436 | blog_authorship_corpus/gender                                        | blog_authorship_corpus                       |                                                     | gender          | blog_authorship_corpus__gender               | Classification      |\n| 437 | blog_authorship_corpus/age                                           | blog_authorship_corpus                       |                                                     | age             | blog_authorship_corpus__age                  | Classification      |\n| 438 | blog_authorship_corpus/job                                           | blog_authorship_corpus                       |                                                     | job             | blog_authorship_corpus__job                  | Classification      |\n| 439 | open_question_type                                                   | launch/open_question_type                    |                                                     |                 | launch_open_question_type                    | Classification      |\n| 440 | health_fact                                                          | health_fact                                  |                                                     |                 | health_fact                                  | Classification      |\n| 441 | commonsense_qa                                                       | commonsense_qa                               |                                                     |                 | commonsense_qa                               | MultipleChoice      |\n| 442 | mc_taco                                                              | mc_taco                                      |                                                     |                 | mc_taco                                      | Classification      |\n| 443 | ade_corpus_v2/Ade_corpus_v2_classification                           | ade_corpus_v2                                | Ade_corpus_v2_classification                        |                 | ade_corpus_v2___Ade_corpus_v2_classification | Classification      |\n| 444 | discosense                                                           | prajjwal1/discosense                         |                                                     |                 | discosense                                   | MultipleChoice      |\n| 445 | circa                                                                | circa                                        |                                                     |                 | circa                                        | Classification      |\n| 446 | phrase_similarity                                                    | PiC/phrase_similarity                        |                                                     |                 | phrase_similarity                            | Classification      |\n| 447 | scientific-exaggeration-detection                                    | copenlu/scientific-exaggeration-detection    |                                                     |                 | exaggeration_detection                       | Classification      |\n| 448 | quarel                                                               | quarel                                       |                                                     |                 | quarel                                       | Classification      |\n| 449 | fever-evidence-related                                               | mwong/fever-evidence-related                 |                                                     |                 | mwong_fever_evidence_related                 | Classification      |\n| 450 | numer_sense                                                          | numer_sense                                  |                                                     |                 | numer_sense                                  | Classification      |\n| 451 | dynasent/dynabench.dynasent.r1.all/r1                                | dynabench/dynasent                           | dynabench.dynasent.r1.all                           | r1              | dynasent__r1                                 | Classification      |\n| 452 | dynasent/dynabench.dynasent.r2.all/r2                                | dynabench/dynasent                           | dynabench.dynasent.r2.all                           | r2              | dynasent__r2                                 | Classification      |\n| 453 | Sarcasm_News_Headline                                                | raquiba/Sarcasm_News_Headline                |                                                     |                 | sarcasm_news                                 | Classification      |\n| 454 | sem_eval_2010_task_8                                                 | sem_eval_2010_task_8                         |                                                     |                 | sem_eval_2010_task_8                         | Classification      |\n| 455 | auditor_review                                                       | demo-org/auditor_review                      |                                                     |                 | auditor_review                               | Classification      |\n| 456 | medmcqa                                                              | medmcqa                                      |                                                     |                 | medmcqa                                      | MultipleChoice      |\n| 457 | Dynasent_Disagreement                                                | RuyuanWan/Dynasent_Disagreement              |                                                     |                 | dynasent_disagreement                        | Classification      |\n| 458 | Politeness_Disagreement                                              | RuyuanWan/Politeness_Disagreement            |                                                     |                 | politeness_disagreement                      | Classification      |\n| 459 | SBIC_Disagreement                                                    | RuyuanWan/SBIC_Disagreement                  |                                                     |                 | sbic_disagreement                            | Classification      |\n| 460 | SChem_Disagreement                                                   | RuyuanWan/SChem_Disagreement                 |                                                     |                 | schem_disagreement                           | Classification      |\n| 461 | Dilemmas_Disagreement                                                | RuyuanWan/Dilemmas_Disagreement              |                                                     |                 | dilemmas_disagreement                        | Classification      |\n| 462 | logiqa                                                               | lucasmccabe/logiqa                           |                                                     |                 | logiqa                                       | MultipleChoice      |\n| 463 | wiki_qa                                                              | wiki_qa                                      |                                                     |                 | wiki_qa                                      | Classification      |\n| 464 | cycic_classification                                                 | tasksource/cycic_classification              |                                                     |                 | cycic_classification                         | Classification      |\n| 465 | cycic_multiplechoice                                                 | tasksource/cycic_multiplechoice              |                                                     |                 | cycic_mc                                     | MultipleChoice      |\n| 466 | sts-companion                                                        | tasksource/sts-companion                     |                                                     |                 | sts_companion                                | Classification      |\n| 467 | commonsense_qa_2.0                                                   | tasksource/commonsense_qa_2.0                |                                                     |                 | commonsense_qa_2                             | Classification      |\n| 468 | lingnli                                                              | tasksource/lingnli                           |                                                     |                 | ling_nli                                     | Classification      |\n| 469 | monotonicity-entailment                                              | tasksource/monotonicity-entailment           |                                                     |                 | monotonicity_entailment                      | Classification      |\n| 470 | arct                                                                 | tasksource/arct                              |                                                     |                 | arct                                         | MultipleChoice      |\n| 471 | scinli                                                               | tasksource/scinli                            |                                                     |                 | scinli                                       | Classification      |\n| 472 | naturallogic                                                         | tasksource/naturallogic                      |                                                     |                 | naturallogic                                 | Classification      |\n| 473 | onestop_qa                                                           | onestop_qa                                   |                                                     |                 | onestop_qa                                   | MultipleChoice      |\n| 474 | moral_stories/full                                                   | demelin/moral_stories                        | full                                                |                 | moral_stories                                | MultipleChoice      |\n| 475 | prost                                                                | corypaik/prost                               |                                                     |                 | prost                                        | MultipleChoice      |\n| 476 | dynahate                                                             | aps/dynahate                                 |                                                     |                 | dyna_hate                                    | Classification      |\n| 477 | syntactic-augmentation-nli                                           | metaeval/syntactic-augmentation-nli          |                                                     |                 | syntactic_augmentation_nli                   | Classification      |\n| 478 | autotnli                                                             | tasksource/autotnli                          |                                                     |                 | autotnli                                     | Classification      |\n| 479 | CONDAQA                                                              | lasha-nlp/CONDAQA                            |                                                     |                 | conqada                                      | Classification      |\n| 480 | webgpt_comparisons                                                   | openai/webgpt_comparisons                    |                                                     |                 | webgbpt_comparisons                          | MultipleChoice      |\n| 481 | synthetic-instruct-gptj-pairwise                                     | Dahoas/synthetic-instruct-gptj-pairwise      |                                                     |                 | synthetic_instruct                           | MultipleChoice      |\n| 482 | scruples                                                             | metaeval/scruples                            |                                                     |                 | scruples                                     | Classification      |\n| 483 | wouldyourather                                                       | metaeval/wouldyourather                      |                                                     |                 | wouldyourather                               | MultipleChoice      |\n| 484 | defeasible-nli/snli                                                  | metaeval/defeasible-nli                      | snli                                                |                 | defeasible_nli                               | Classification      |\n| 485 | defeasible-nli/atomic                                                | metaeval/defeasible-nli                      | atomic                                              |                 | defeasible_nli                               | Classification      |\n| 486 | help-nli                                                             | tasksource/help-nli                          |                                                     |                 | help_nli                                     | Classification      |\n| 487 | nli-veridicality-transitivity                                        | metaeval/nli-veridicality-transitivity       |                                                     |                 | nli_veridicality_transitivity                | Classification      |\n| 488 | lonli                                                                | tasksource/lonli                             |                                                     |                 | lonli                                        | Classification      |\n| 489 | dadc-limit-nli                                                       | tasksource/dadc-limit-nli                    |                                                     |                 | dadc_limit                                   | Classification      |\n| 490 | FLUTE                                                                | ColumbiaNLP/FLUTE                            |                                                     |                 | flute                                        | Classification      |\n| 491 | strategy-qa                                                          | tasksource/strategy-qa                       |                                                     |                 | strategy_qa                                  | Classification      |\n| 492 | summarize_from_feedback/comparisons                                  | openai/summarize_from_feedback               | comparisons                                         |                 | summarize_from_feedback                      | MultipleChoice      |\n| 493 | folio                                                                | tasksource/folio                             |                                                     |                 | folio                                        | Classification      |\n| 494 | tomi-nli                                                             | tasksource/tomi-nli                          |                                                     |                 | tomi_nli                                     | Classification      |\n| 495 | avicenna                                                             | tasksource/avicenna                          |                                                     |                 | avicenna                                     | Classification      |\n| 496 | SHP                                                                  | stanfordnlp/SHP                              |                                                     |                 | shp                                          | MultipleChoice      |\n| 497 | MedQA-USMLE-4-options-hf                                             | GBaker/MedQA-USMLE-4-options-hf              |                                                     |                 | medqa_usmle                                  | MultipleChoice      |\n| 498 | wikimedqa/medwiki                                                    | sileod/wikimedqa                             | medwiki                                             |                 | wikimedqa                                    | MultipleChoice      |\n| 499 | cicero                                                               | declare-lab/cicero                           |                                                     |                 | cicero                                       | MultipleChoice      |\n| 500 | CREAK                                                                | amydeng2000/CREAK                            |                                                     |                 | creak                                        | Classification      |\n| 501 | mutual                                                               | tasksource/mutual                            |                                                     |                 | mutual                                       | MultipleChoice      |\n| 502 | NeQA                                                                 | inverse-scaling/NeQA                         |                                                     |                 | neqa                                         | MultipleChoice      |\n| 503 | quote-repetition                                                     | inverse-scaling/quote-repetition             |                                                     |                 | quote_repetition                             | MultipleChoice      |\n| 504 | redefine-math                                                        | inverse-scaling/redefine-math                |                                                     |                 | redefine_math                                | MultipleChoice      |\n| 505 | puzzte                                                               | tasksource/puzzte                            |                                                     |                 | puzzte                                       | Classification      |\n| 506 | implicatures                                                         | tasksource/implicatures                      |                                                     |                 | implicatures                                 | MultipleChoice      |\n| 507 | race/middle                                                          | race                                         | middle                                              |                 | race                                         | MultipleChoice      |\n| 508 | race/high                                                            | race                                         | high                                                |                 | race                                         | MultipleChoice      |\n| 509 | race-c                                                               | tasksource/race-c                            |                                                     |                 | race_c                                       | MultipleChoice      |\n| 510 | spartqa-yn                                                           | tasksource/spartqa-yn                        |                                                     |                 | spartqa_yn                                   | Classification      |\n| 511 | spartqa-mchoice                                                      | tasksource/spartqa-mchoice                   |                                                     |                 | spartqa_mc                                   | MultipleChoice      |\n| 512 | temporal-nli                                                         | tasksource/temporal-nli                      |                                                     |                 | temporal_nli                                 | Classification      |\n| 513 | riddle_sense                                                         | riddle_sense                                 |                                                     |                 | riddle_sense                                 | MultipleChoice      |\n| 514 | clcd-english                                                         | tasksource/clcd-english                      |                                                     |                 | clcd                                         | Classification      |\n| 515 | twentyquestions                                                      | maximedb/twentyquestions                     |                                                     |                 | twentyquestions                              | Classification      |\n| 516 | reclor                                                               | metaeval/reclor                              |                                                     |                 | reclor                                       | MultipleChoice      |\n| 517 | counterfactually-augmented-imdb                                      | tasksource/counterfactually-augmented-imdb   |                                                     |                 | c_aug_imdb                                   | Classification      |\n| 518 | counterfactually-augmented-snli                                      | tasksource/counterfactually-augmented-snli   |                                                     |                 | c_aug_snli                                   | Classification      |\n| 519 | cnli                                                                 | metaeval/cnli                                |                                                     |                 | cnli                                         | Classification      |\n| 520 | boolq-natural-perturbations                                          | tasksource/boolq-natural-perturbations       |                                                     |                 | perturbed_boolq                              | Classification      |\n| 521 | acceptability-prediction                                             | metaeval/acceptability-prediction            |                                                     |                 | graded_acceptability                         | Classification      |\n| 522 | equate                                                               | metaeval/equate                              |                                                     |                 | equate                                       | Classification      |\n| 523 | ScienceQA_text_only                                                  | tasksource/ScienceQA_text_only               |                                                     |                 | science_qa                                   | MultipleChoice      |\n| 524 | ekar_english                                                         | Jiangjie/ekar_english                        |                                                     |                 | ekar                                         | MultipleChoice      |\n| 525 | implicit-hate-stg1                                                   | tasksource/implicit-hate-stg1                |                                                     |                 | implicit_hate                                | Classification      |\n| 526 | chaos-mnli-ambiguity                                                 | metaeval/chaos-mnli-ambiguity                |                                                     |                 | nli_unambiguity                              | Classification      |\n| 527 | headline_cause/en_simple                                             | IlyaGusev/headline_cause                     | en_simple                                           |                 | headline_cause                               | Classification      |\n| 528 | logiqa-2.0-nli                                                       | tasksource/logiqa-2.0-nli                    |                                                     |                 | logiqa_2                                     | Classification      |\n| 529 | oasst2_dense_flat/quality                                            | tasksource/oasst2_dense_flat                 |                                                     | quality         | oasst1__quality                              | Classification      |\n| 530 | oasst2_dense_flat/toxicity                                           | tasksource/oasst2_dense_flat                 |                                                     | toxicity        | oasst1__toxicity                             | Classification      |\n| 531 | oasst2_dense_flat/helpfulness                                        | tasksource/oasst2_dense_flat                 |                                                     | helpfulness     | oasst1__helpfulness                          | Classification      |\n| 532 | mindgames                                                            | sileod/mindgames                             |                                                     |                 | mindgames                                    | Classification      |\n| 533 | universal_dependencies/en_lines/deprel                               | universal_dependencies                       | en_lines                                            | deprel          | udep__deprel                                 | TokenClassification |\n| 534 | universal_dependencies/en_gum/deprel                                 | universal_dependencies                       | en_gum                                              | deprel          | udep__deprel                                 | TokenClassification |\n| 535 | universal_dependencies/en_partut/deprel                              | universal_dependencies                       | en_partut                                           | deprel          | udep__deprel                                 | TokenClassification |\n| 536 | universal_dependencies/en_ewt/deprel                                 | universal_dependencies                       | en_ewt                                              | deprel          | udep__deprel                                 | TokenClassification |\n| 537 | ambient                                                              | metaeval/ambient                             |                                                     |                 | ambient                                      | Classification      |\n| 538 | path-naturalness-prediction                                          | metaeval/path-naturalness-prediction         |                                                     |                 | path_naturalness                             | MultipleChoice      |\n| 539 | civil_comments/toxicity                                              | civil_comments                               |                                                     | toxicity        | civil_comments__toxicity                     | Classification      |\n| 540 | civil_comments/severe_toxicity                                       | civil_comments                               |                                                     | severe_toxicity | civil_comments__severe_toxicity              | Classification      |\n| 541 | civil_comments/obscene                                               | civil_comments                               |                                                     | obscene         | civil_comments__obscene                      | Classification      |\n| 542 | civil_comments/threat                                                | civil_comments                               |                                                     | threat          | civil_comments__threat                       | Classification      |\n| 543 | civil_comments/insult                                                | civil_comments                               |                                                     | insult          | civil_comments__insult                       | Classification      |\n| 544 | civil_comments/identity_attack                                       | civil_comments                               |                                                     | identity_attack | civil_comments__identity_attack              | Classification      |\n| 545 | civil_comments/sexual_explicit                                       | civil_comments                               |                                                     | sexual_explicit | civil_comments__sexual_explicit              | Classification      |\n| 546 | cloth                                                                | AndyChiang/cloth                             |                                                     |                 | cloth                                        | MultipleChoice      |\n| 547 | dgen                                                                 | AndyChiang/dgen                              |                                                     |                 | dgen                                         | MultipleChoice      |\n| 548 | I2D2                                                                 | tasksource/I2D2                              |                                                     |                 | i2d2                                         | Classification      |\n| 549 | args_me                                                              | webis/args_me                                |                                                     |                 | arg_me                                       | Classification      |\n| 550 | Touche23-ValueEval                                                   | webis/Touche23-ValueEval                     |                                                     |                 | valueeval_stance                             | Classification      |\n| 551 | starcon                                                              | tasksource/starcon                           |                                                     |                 | starcon                                      | Classification      |\n| 552 | banking77                                                            | PolyAI/banking77                             |                                                     |                 | banking77                                    | Classification      |\n| 553 | ConTRoL-nli                                                          | tasksource/ConTRoL-nli                       |                                                     |                 | control                                      | Classification      |\n| 554 | tracie                                                               | tasksource/tracie                            |                                                     |                 | tracie                                       | Classification      |\n| 555 | sherliic                                                             | tasksource/sherliic                          |                                                     |                 | sherliic                                     | Classification      |\n| 556 | sen-making/1                                                         | tasksource/sen-making                        |                                                     | 1               | sen_making__1                                | MultipleChoice      |\n| 557 | sen-making/2                                                         | tasksource/sen-making                        |                                                     | 2               | sen_making__2                                | MultipleChoice      |\n| 558 | winowhy                                                              | tasksource/winowhy                           |                                                     |                 | winowhy                                      | Classification      |\n| 559 | robustLR                                                             | tasksource/robustLR                          |                                                     |                 | robustLR                                     | Classification      |\n| 560 | v1/gen_train234_test2to10                                            | CLUTRR/v1                                    | gen_train234_test2to10                              |                 | cluttr                                       | Classification      |\n| 561 | logical-fallacy                                                      | tasksource/logical-fallacy                   |                                                     |                 | logical_fallacy                              | Classification      |\n| 562 | parade                                                               | tasksource/parade                            |                                                     |                 | parade                                       | Classification      |\n| 563 | cladder                                                              | tasksource/cladder                           |                                                     |                 | cladder                                      | Classification      |\n| 564 | subjectivity                                                         | tasksource/subjectivity                      |                                                     |                 | subjectivity                                 | Classification      |\n| 565 | MOH                                                                  | tasksource/MOH                               |                                                     |                 | moh                                          | Classification      |\n| 566 | VUAC                                                                 | tasksource/VUAC                              |                                                     |                 | vuac                                         | Classification      |\n| 567 | TroFi                                                                | tasksource/TroFi                             |                                                     |                 | trofi                                        | Classification      |\n| 568 | sharc_modified/mod                                                   | sharc_modified                               | mod                                                 |                 | sharc_classification                         | Classification      |\n| 569 | conceptrules_v2                                                      | tasksource/conceptrules_v2                   |                                                     |                 | conceptrules_v2                              | Classification      |\n| 570 | disrpt/eng.dep.scidtb.rels                                           | metaeval/disrpt                              | eng.dep.scidtb.rels                                 |                 | scidtb                                       | Classification      |\n| 571 | conll2000                                                            | conll2000                                    |                                                     |                 | chunking                                     | TokenClassification |\n| 572 | few-nerd/supervised                                                  | DFKI-SLT/few-nerd                            | supervised                                          |                 | few_nerd                                     | TokenClassification |\n| 573 | finer-139                                                            | nlpaueb/finer-139                            |                                                     |                 | finer                                        | TokenClassification |\n| 574 | zero-shot-label-nli                                                  | tasksource/zero-shot-label-nli               |                                                     |                 | label_nli                                    | Classification      |\n| 575 | com2sense                                                            | tasksource/com2sense                         |                                                     |                 | com2sense                                    | Classification      |\n| 576 | scone                                                                | tasksource/scone                             |                                                     |                 | scone                                        | Classification      |\n| 577 | winodict                                                             | tasksource/winodict                          |                                                     |                 | winodict                                     | MultipleChoice      |\n| 578 | fool-me-twice                                                        | tasksource/fool-me-twice                     |                                                     |                 | fool_me_twice                                | Classification      |\n| 579 | monli                                                                | tasksource/monli                             |                                                     |                 | monli                                        | Classification      |\n| 580 | corr2cause                                                           | tasksource/corr2cause                        |                                                     |                 | causality                                    | Classification      |\n| 581 | lsat_qa/all                                                          | lighteval/lsat_qa                            | all                                                 |                 | lsat                                         | MultipleChoice      |\n| 582 | apt                                                                  | tasksource/apt                               |                                                     |                 | apt                                          | Classification      |\n| 583 | twitter-financial-news-sentiment                                     | zeroshot/twitter-financial-news-sentiment    |                                                     |                 | financial_sentiment                          | Classification      |\n| 584 | icl-symbol-tuning-instruct                                           | tasksource/icl-symbol-tuning-instruct        |                                                     |                 | icl                                          | Classification      |\n| 585 | SpaceNLI                                                             | tasksource/SpaceNLI                          |                                                     |                 | space_nli                                    | Classification      |\n| 586 | propsegment/nli                                                      | sihaochen/propsegment                        | nli                                                 |                 | propsegment                                  | Classification      |\n| 587 | HatemojiBuild                                                        | HannahRoseKirk/HatemojiBuild                 |                                                     |                 | hatemoji                                     | Classification      |\n| 588 | regset                                                               | tasksource/regset                            |                                                     |                 | regset                                       | Classification      |\n| 589 | esci                                                                 | tasksource/esci                              |                                                     |                 | esci                                         | Classification      |\n| 590 | chatbot_arena_conversations                                          | lmsys/chatbot_arena_conversations            |                                                     |                 | chatbot_arena                                | MultipleChoice      |\n| 591 | dnd_style_intents                                                    | neurae/dnd_style_intents                     |                                                     |                 | dnd_intent                                   | Classification      |\n| 592 | FLD.v2/default                                                       | hitachi-nlp/FLD.v2                           | default                                             |                 | fld                                          | Classification      |\n| 593 | FLD.v2/star                                                          | hitachi-nlp/FLD.v2                           | star                                                |                 | flds                                         | Classification      |\n| 594 | SDOH-NLI                                                             | tasksource/SDOH-NLI                          |                                                     |                 | sdoh_nli                                     | Classification      |\n| 595 | scifact_entailment                                                   | allenai/scifact_entailment                   |                                                     |                 | scifact_entailment                           | Classification      |\n| 596 | feasibilityQA                                                        | tasksource/feasibilityQA                     |                                                     |                 | feasibilityQA                                | Classification      |\n| 597 | simple_pair                                                          | tasksource/simple_pair                       |                                                     |                 | simple_pair                                  | Classification      |\n| 598 | AdjectiveScaleProbe-nli                                              | tasksource/AdjectiveScaleProbe-nli           |                                                     |                 | adjective_scale_probe                        | Classification      |\n| 599 | resnli                                                               | tasksource/resnli                            |                                                     |                 | repectively_nli                              | Classification      |\n| 600 | SpaRTUN                                                              | tasksource/SpaRTUN                           |                                                     |                 | spartun                                      | MultipleChoice      |\n| 601 | ReSQ                                                                 | tasksource/ReSQ                              |                                                     |                 | resq                                         | MultipleChoice      |\n| 602 | semantic_fragments_nli                                               | tasksource/semantic_fragments_nli            |                                                     |                 | semantic_fragments_nli                       | Classification      |\n| 603 | dataset_train_nli                                                    | MoritzLaurer/dataset_train_nli               |                                                     |                 | moritz_zs_nli                                | Classification      |\n| 604 | stepgame                                                             | tasksource/stepgame                          |                                                     |                 | stepgame                                     | Classification      |\n| 605 | nlgraph                                                              | tasksource/nlgraph                           |                                                     |                 | nlgraph                                      | Classification      |\n| 606 | oasst2_pairwise_rlhf_reward                                          | tasksource/oasst2_pairwise_rlhf_reward       |                                                     |                 | oasst_rlhf                                   | MultipleChoice      |\n| 607 | hh-rlhf/helpful-rejection-sampled                                    | tasksource/hh-rlhf                           | helpful-rejection-sampled                           |                 | anthropic_rlhf_helpfulness                   | MultipleChoice      |\n| 608 | hh-rlhf/helpful-online                                               | tasksource/hh-rlhf                           | helpful-online                                      |                 | anthropic_rlhf_helpfulness                   | MultipleChoice      |\n| 609 | hh-rlhf/helpful-base                                                 | tasksource/hh-rlhf                           | helpful-base                                        |                 | anthropic_rlhf_helpfulness                   | MultipleChoice      |\n| 610 | hh-rlhf/harmless-base                                                | tasksource/hh-rlhf                           | harmless-base                                       |                 | anthropic_rlhf_harmless                      | MultipleChoice      |\n| 611 | ruletaker                                                            | tasksource/ruletaker                         |                                                     |                 | ruletaker                                    | Classification      |\n| 612 | PARARULE-Plus                                                        | qbao775/PARARULE-Plus                        |                                                     |                 | para_rules                                   | Classification      |\n| 613 | proofwriter                                                          | tasksource/proofwriter                       |                                                     |                 | proofwriter_deduction                        | Classification      |\n| 614 | logical-entailment                                                   | tasksource/logical-entailment                |                                                     |                 | logical_entailment                           | Classification      |\n| 615 | nope                                                                 | tasksource/nope                              |                                                     |                 | nope                                         | Classification      |\n| 616 | LogicNLI                                                             | tasksource/LogicNLI                          |                                                     |                 | logicNLI                                     | Classification      |\n| 617 | contract-nli/contractnli_a/seg                                       | kiddothe2b/contract-nli                      | contractnli_a                                       | seg             | contract_nli__seg                            | Classification      |\n| 618 | contract-nli/contractnli_b/full                                      | kiddothe2b/contract-nli                      | contractnli_b                                       | full            | contract_nli__full                           | Classification      |\n| 619 | nli4ct_semeval2024                                                   | AshtonIsNotHere/nli4ct_semeval2024           |                                                     |                 | nli4ct                                       | Classification      |\n| 620 | lsat-ar                                                              | tasksource/lsat-ar                           |                                                     |                 | lsat_ar                                      | MultipleChoice      |\n| 621 | lsat-rc                                                              | tasksource/lsat-rc                           |                                                     |                 | lsat_rc                                      | MultipleChoice      |\n| 622 | biosift-nli                                                          | AshtonIsNotHere/biosift-nli                  |                                                     |                 | biosift_nli                                  | Classification      |\n| 623 | brainteasers/SP                                                      | tasksource/brainteasers                      | SP                                                  |                 | brainteasers                                 | MultipleChoice      |\n| 624 | brainteasers/WP                                                      | tasksource/brainteasers                      | WP                                                  |                 | brainteasers                                 | MultipleChoice      |\n| 625 | persuasion                                                           | Anthropic/persuasion                         |                                                     |                 | persuasiveness                               | Classification      |\n| 626 | AmbigNQ-clarifying-question                                          | erbacher/AmbigNQ-clarifying-question         |                                                     |                 | ambigNQ                                      | Classification      |\n| 627 | SIGA-nli                                                             | tasksource/SIGA-nli                          |                                                     |                 | siga_nli                                     | Classification      |\n| 628 | FOL-nli                                                              | unigram/FOL-nli                              |                                                     |                 | unigram_fol                                  | Classification      |\n| 629 | goal-step-wikihow/order                                              | tasksource/goal-step-wikihow                 | order                                               |                 | gs_order                                     | MultipleChoice      |\n| 630 | PARADISE                                                             | GGLab/PARADISE                               |                                                     |                 | paradise                                     | MultipleChoice      |\n| 631 | doc-nli                                                              | tasksource/doc-nli                           |                                                     |                 | docnli                                       | Classification      |\n| 632 | mctest-nli                                                           | tasksource/mctest-nli                        |                                                     |                 | mctest_nli                                   | Classification      |\n| 633 | patent-phrase-similarity                                             | tasksource/patent-phrase-similarity          |                                                     |                 | patent_phrase_similarity                     | Classification      |\n| 634 | natural-language-satisfiability                                      | tasksource/natural-language-satisfiability   |                                                     |                 | nlsat                                        | Classification      |\n| 635 | idioms-nli                                                           | tasksource/idioms-nli                        |                                                     |                 | idioms_nli                                   | Classification      |\n| 636 | lifecycle-entailment                                                 | tasksource/lifecycle-entailment              |                                                     |                 | lifeycle_entailment                          | Classification      |\n| 637 | HelpSteer/helpfulness                                                | nvidia/HelpSteer                             |                                                     | helpfulness     | helpsteer__helpfulness                       | Classification      |\n| 638 | HelpSteer/correctness                                                | nvidia/HelpSteer                             |                                                     | correctness     | helpsteer__correctness                       | Classification      |\n| 639 | HelpSteer/coherence                                                  | nvidia/HelpSteer                             |                                                     | coherence       | helpsteer__coherence                         | Classification      |\n| 640 | HelpSteer/complexity                                                 | nvidia/HelpSteer                             |                                                     | complexity      | helpsteer__complexity                        | Classification      |\n| 641 | HelpSteer/verbosity                                                  | nvidia/HelpSteer                             |                                                     | verbosity       | helpsteer__verbosity                         | Classification      |\n| 642 | HelpSteer2/helpfulness                                               | nvidia/HelpSteer2                            |                                                     | helpfulness     | helpsteer_2__helpfulness                     | Classification      |\n| 643 | HelpSteer2/correctness                                               | nvidia/HelpSteer2                            |                                                     | correctness     | helpsteer_2__correctness                     | Classification      |\n| 644 | HelpSteer2/coherence                                                 | nvidia/HelpSteer2                            |                                                     | coherence       | helpsteer_2__coherence                       | Classification      |\n| 645 | HelpSteer2/complexity                                                | nvidia/HelpSteer2                            |                                                     | complexity      | helpsteer_2__complexity                      | Classification      |\n| 646 | HelpSteer2/verbosity                                                 | nvidia/HelpSteer2                            |                                                     | verbosity       | helpsteer_2__verbosity                       | Classification      |\n| 647 | MSciNLI                                                              | sadat2307/MSciNLI                            |                                                     |                 | msci_nli                                     | Classification      |\n| 648 | UltraFeedback-paired                                                 | pushpdeep/UltraFeedback-paired               |                                                     |                 | ultrafeedback                                | MultipleChoice      |\n| 649 | AES2-essay-scoring                                                   | tasksource/AES2-essay-scoring                |                                                     |                 | essay_scoring                                | Classification      |\n| 650 | english-grading/cohesion                                             | tasksource/english-grading                   |                                                     | cohesion        | grading__cohesion                            | Classification      |\n| 651 | english-grading/syntax                                               | tasksource/english-grading                   |                                                     | syntax          | grading__syntax                              | Classification      |\n| 652 | english-grading/vocabulary                                           | tasksource/english-grading                   |                                                     | vocabulary      | grading__vocabulary                          | Classification      |\n| 653 | english-grading/phraseology                                          | tasksource/english-grading                   |                                                     | phraseology     | grading__phraseology                         | Classification      |\n| 654 | english-grading/grammar                                              | tasksource/english-grading                   |                                                     | grammar         | grading__grammar                             | Classification      |\n| 655 | english-grading/conventions                                          | tasksource/english-grading                   |                                                     | conventions     | grading__conventions                         | Classification      |\n| 656 | wice                                                                 | tasksource/wice                              |                                                     |                 | wice                                         | Classification      |\n| 657 | hover                                                                | Dzeniks/hover                                |                                                     |                 | hover                                        | Classification      |\n| 658 | hover-3way/nli                                                       | Dzeniks/hover-3way                           |                                                     | nli             | hover__nli                                   | Classification      |\n| 659 | tasksource_dpo_pairs                                                 | tasksource/tasksource_dpo_pairs              |                                                     |                 | tasksource_dpo                               | MultipleChoice      |\n| 660 | seahorse_summarization_evaluation                                    | tasksource/seahorse_summarization_evaluation |                                                     |                 | seahorse                                     | Classification      |\n| 661 | missing-item-prediction/contrastive                                  | sileod/missing-item-prediction               | contrastive                                         |                 | mip                                          | Classification      |\n| 662 | jigsaw_toxicity                                                      | tasksource/jigsaw_toxicity                   |                                                     |                 | jigsaw_toxicity                              | Classification      |\n| 663 | Pol_NLI                                                              | mlburnham/Pol_NLI                            |                                                     |                 | pol_nli                                      | Classification      |\n| 664 | synthetic-retrieval-NLI/count                                        | tasksource/synthetic-retrieval-NLI           | count                                               |                 | synthetic_retrieval_nli                      | Classification      |\n| 665 | synthetic-retrieval-NLI/position                                     | tasksource/synthetic-retrieval-NLI           | position                                            |                 | synthetic_retrieval_nli                      | Classification      |\n| 666 | synthetic-retrieval-NLI/binary                                       | tasksource/synthetic-retrieval-NLI           | binary                                              |                 | synthetic_retrieval_nli                      | Classification      |\n"
  }
]